Spaces:
Running
Running
File size: 492 Bytes
667fe9d |
1 2 3 4 5 6 7 8 9 10 11 12 13 14 15 16 17 |
from pathlib import Path
# --- Numeric settings -------------------------------------------------------
# Only the values are fixed here; how each one is consumed is up to the
# importing modules (presumably RNG seeding, a tokenizer/vectorizer feature
# cap and a classifier iteration limit -- confirm at the use sites).
DEFAULT_SEED: int = 42
MAX_TOKENIZER_FEATURES: int = 500_000
CLF_MAX_ITER: int = 1_000

# --- Data file locations ----------------------------------------------------
# Relative paths: they resolve against the process's current working directory.
DATASET_PATH: Path = Path("data/training.1600000.processed.noemoticon.csv")
STOPWORDS_PATH: Path = Path("data/stopwords-en.txt")

# --- Working directories ----------------------------------------------------
# Each directory is created as a side effect of importing this module.
# parents=True also creates missing ancestors; exist_ok=True keeps the call
# from raising when the directory is already there.
MODELS_DIR: Path = Path("models")
MODELS_DIR.mkdir(exist_ok=True, parents=True)

CACHE_DIR: Path = Path("cache")
CACHE_DIR.mkdir(exist_ok=True, parents=True)

# Checkpoint file located inside the cache directory.
CHECKPOINT_PATH: Path = CACHE_DIR.joinpath("pipeline.pkl")
|