KingZack committed on
Commit
23f9974
·
1 Parent(s): 6532466

Add vectorization settings to the config, such as chunk size and embedding model name

Browse files
Files changed (1) hide show
  1. src/ctp_slack_bot/core/config.py +9 -0
src/ctp_slack_bot/core/config.py CHANGED
@@ -13,6 +13,13 @@ class Settings(BaseSettings):
13
  API_HOST: str = "0.0.0.0"
14
  API_PORT: int = 8000
15
  DEBUG: bool = False
 
 
 
 
 
 
 
16
 
17
  # MongoDB Configuration
18
  MONGODB_URI: Optional[SecretStr] = None # TODO: Remove optionality
@@ -25,6 +32,8 @@ class Settings(BaseSettings):
25
 
26
  # Hugging Face Configuration
27
  HF_API_TOKEN: Optional[SecretStr] = None
 
 
28
 
29
  # Logging Configuration
30
  LOG_LEVEL: Literal["DEBUG", "INFO", "WARNING", "ERROR", "CRITICAL"] = "INFO"
 
13
  API_HOST: str = "0.0.0.0"
14
  API_PORT: int = 8000
15
  DEBUG: bool = False
16
+
17
+ # Vectorization Configuration
18
+ EMBEDDING_MODEL: str = "text-embedding-3-small"
19
+ VECTOR_DIMENSION: int = 1536
20
+ CHUNK_SIZE: int = 1000
21
+ CHUNK_OVERLAP: int = 200
22
+ TOP_K_MATCHES: int = 5
23
 
24
  # MongoDB Configuration
25
  MONGODB_URI: Optional[SecretStr] = None # TODO: Remove optionality
 
32
 
33
  # Hugging Face Configuration
34
  HF_API_TOKEN: Optional[SecretStr] = None
35
+
36
+
37
 
38
  # Logging Configuration
39
  LOG_LEVEL: Literal["DEBUG", "INFO", "WARNING", "ERROR", "CRITICAL"] = "INFO"