File size: 2,244 Bytes
57cf043
c7266d8
 
57cf043
 
 
 
c7266d8
57cf043
 
 
 
 
 
c7266d8
57cf043
 
 
 
 
 
 
 
 
 
29769f8
57cf043
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
c7266d8
 
 
57cf043
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
# Log output locations: a log file path and a database URL.
# Values tagged `!ENV` use `${NAME:default}` placeholders; presumably the
# config loader substitutes environment variable NAME and falls back to the
# text after the first `:` when it is unset - confirm against the loader.
common:
  log_file_path: !ENV ${LOG_FILE_PATH:/data/logs/common.log}
  # Read from SQLALCHEMY_DATABASE_URL (not a LOG_*-named variable); the
  # default is a SQLite URL pointing at /data/logs.db.
  log_sql_path: !ENV ${SQLALCHEMY_DATABASE_URL:sqlite:////data/logs.db}

# Storage and search settings, grouped as: faiss, elastic, ranging, search,
# files.
bd:
  # FAISS group: embedding model, metadata location and compute device.
  faiss:
    model_embedding_path: !ENV ${EMBEDDING_MODEL_PATH:intfloat/multilingual-e5-large}
    # Default is the same directory as files.regulations_path below.
    path_to_metadata: !ENV ${PATH_TO_METADATA:/data/regulation_datasets}
    device: !ENV ${FAISS_DEVICE:cuda}

  # Elasticsearch connection settings.
  # NOTE(review): use_elastic is false while some search.*_elastic_search
  # toggles below are true; how the flags interact is not visible here.
  elastic:
    use_elastic: false
    es_host: !ENV ${ELASTIC_HOST:localhost}
    # NOTE(review): the value passes through the !ENV tag, so it may arrive
    # as the string "9200" rather than an integer - confirm in the loader.
    es_port: !ENV ${ELASTIC_PORT:9200}
    people_path: /data/person_card

  # Presumably result-ranking parameters ("ranging"); disabled by default.
  # NOTE(review): the roles of alpha and beta are not visible in this file.
  ranging:
    use_ranging: false
    alpha: 0.35
    beta: -0.15
    k_neighbors: 100

  # Per-source search sections. Each has its own use_* toggle and a
  # k_neighbors value; every section except vector_search also names an
  # index via index_name.
  search:
    vector_search:
      use_vector_search: true
      k_neighbors: 100

    people_elastic_search:
      use_people_search: false
      index_name: 'people_search'
      k_neighbors: 10

    chunks_elastic_search:
      use_chunks_search: true
      index_name: 'nmd_full_text'
      k_neighbors: 5

    groups_elastic_search:
      use_groups_search: false
      index_name: 'group_search_elastic_nn'
      k_neighbors: 1

    rocks_nn_elastic_search:
      use_rocks_nn_search: false
      index_name: 'rocks_nn_search_elastic'
      k_neighbors: 1

    segmentation_elastic_search:
      use_segmentation_search: false
      index_name: 'segmentation_search_elastic'
      k_neighbors: 1

    # If a search does not operate on chunks, add its key name from the
    # `answer` dict of the `search_answer` function to this list!!!
    stop_index_names: ['people_answer', 'groups_answer', 'rocks_nn_answer', 'segmentation_answer']

    abbreviation_search:
      use_abbreviation_search: true
      index_name: 'nmd_abbreviation_elastic'
      k_neighbors: 10

  # Filesystem locations for regulation datasets and documents.
  files:
    empty_start: true
    regulations_path: /data/regulation_datasets
    default_regulations_path: /data/regulation_datasets/default
    documents_path: /data/documents

# LLM endpoint, model selection and sampling parameters.
llm:
  base_url: !ENV ${LLM_BASE_URL:https://api.deepinfra.com}
  # The default is the literal text DEEPINFRA_API_KEY; judging by the key
  # name this is presumably the NAME of the environment variable that holds
  # the API key, not the key itself - confirm against the consumer.
  api_key_env: !ENV ${API_KEY_ENV:DEEPINFRA_API_KEY}
  model: !ENV ${MODEL_NAME:meta-llama/Llama-3.3-70B-Instruct-Turbo}
  # NOTE(review): the tokenizer default comes from a different repository
  # (unsloth/...) than the model default (meta-llama/...) - confirm that
  # they are meant to match.
  tokenizer_name: !ENV ${TOKENIZER_NAME:unsloth/Llama-3.3-70B-Instruct}
  # Fixed values (not overridable through !ENV placeholders in this file).
  temperature: 0.14
  top_p: 0.95
  min_p: 0.05
  # NOTE(review): small negative value - confirm that it is intentional.
  frequency_penalty: -0.001
  presence_penalty: 1.3
  seed: 42