normalize config file and update default benchmark model
backend/config/models_config.py (CHANGED)

```diff
@@ -18,17 +18,22 @@ DEFAULT_EVALUATION_MODELS = [
     "mistralai/Mistral-Small-24B-Instruct-2501",
 ]
 
+# "Qwen/Qwen2.5-72B-Instruct"
+# "meta-llama/Llama-3.1-8B-Instruct"
+# "Qwen/Qwen2.5-32B-Instruct",
+# "deepseek-ai/DeepSeek-R1-Distill-Llama-70B",
+
 # Required model for create_bench_config_file.py (only one default model)
-…
+DEFAULT_BENCHMARK_MODEL = "Qwen/Qwen2.5-32B-Instruct"
 
 # Models by roles for benchmark configuration
 # All roles use the default model except chunking
-…
-    "ingestion": […],
-    "summarization": […],
+BENCHMARK_MODEL_ROLES = {
+    "ingestion": [DEFAULT_BENCHMARK_MODEL],
+    "summarization": [DEFAULT_BENCHMARK_MODEL],
     "chunking": ["intfloat/multilingual-e5-large-instruct"],
-    "single_shot_question_generation": […],
-    "multi_hop_question_generation": […],
+    "single_shot_question_generation": [DEFAULT_BENCHMARK_MODEL],
+    "multi_hop_question_generation": [DEFAULT_BENCHMARK_MODEL],
 }
 
 # Default evaluation timeout (in seconds)
```
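Assembled from the added lines above, the touched section of backend/config/models_config.py should now read roughly as follows. This is an excerpt-only sketch: surrounding definitions such as DEFAULT_EVALUATION_MODELS and DEFAULT_BENCHMARK_TIMEOUT are omitted, and the commented-out model names are kept exactly as they appear in the diff.

```python
# backend/config/models_config.py (post-commit excerpt; sketch, not the full file)

# "Qwen/Qwen2.5-72B-Instruct"
# "meta-llama/Llama-3.1-8B-Instruct"
# "Qwen/Qwen2.5-32B-Instruct",
# "deepseek-ai/DeepSeek-R1-Distill-Llama-70B",

# Required model for create_bench_config_file.py (only one default model)
DEFAULT_BENCHMARK_MODEL = "Qwen/Qwen2.5-32B-Instruct"

# Models by roles for benchmark configuration
# All roles use the default model except chunking
BENCHMARK_MODEL_ROLES = {
    "ingestion": [DEFAULT_BENCHMARK_MODEL],
    "summarization": [DEFAULT_BENCHMARK_MODEL],
    "chunking": ["intfloat/multilingual-e5-large-instruct"],
    "single_shot_question_generation": [DEFAULT_BENCHMARK_MODEL],
    "multi_hop_question_generation": [DEFAULT_BENCHMARK_MODEL],
}
```

Because every role except chunking references DEFAULT_BENCHMARK_MODEL, switching the benchmark model (for example to one of the commented-out alternatives) is a single-line change.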
backend/tasks/create_bench_config_file.py (CHANGED)

```diff
@@ -15,8 +15,8 @@ from huggingface_hub import HfApi
 
 from tasks.get_available_model_provider import get_available_model_provider
 from config.models_config import (
-    …
-    …
+    DEFAULT_BENCHMARK_MODEL,
+    BENCHMARK_MODEL_ROLES,
     DEFAULT_BENCHMARK_TIMEOUT,
 )
 
@@ -124,15 +124,15 @@ class CreateBenchConfigTask:
             raise RuntimeError("HF_TOKEN environment variable is not defined")
 
         # Get provider for the default model
-        provider = self.get_model_provider(…)
+        provider = self.get_model_provider(DEFAULT_BENCHMARK_MODEL)
         if not provider:
-            error_msg = f"Required model not available: {…}"
+            error_msg = f"Required model not available: {DEFAULT_BENCHMARK_MODEL}. Cannot proceed with benchmark."
             self._add_log(f"[ERROR] {error_msg}")
             raise RuntimeError(error_msg)
 
         # Create model configuration
         model_list = [{
-            "model_name": …,
+            "model_name": DEFAULT_BENCHMARK_MODEL,
             "provider": provider,
             "api_key": "$HF_TOKEN",
             "max_concurrent_requests": 32,
@@ -156,7 +156,7 @@ class CreateBenchConfigTask:
             },
             "model_list": model_list,
 
-            "model_roles": …,
+            "model_roles": BENCHMARK_MODEL_ROLES,
             "pipeline": {
                 "ingestion": {
                     "source_documents_dir": f"uploaded_files/{self.session_uid}/uploaded_files/",
```
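Putting the three hunks together, CreateBenchConfigTask now resolves an inference provider for the single DEFAULT_BENCHMARK_MODEL and reuses BENCHMARK_MODEL_ROLES for the generated config's model_roles field. Below is a minimal sketch of that flow; the helper name build_model_section and its parameters are hypothetical stand-ins for the task's own methods (self.get_model_provider, self._add_log), and only the dictionary fields visible in this diff are taken from the source.

```python
# Sketch of how the changed lines fit together inside CreateBenchConfigTask.
# Only the fields shown in the diff are real; the helper itself is illustrative.
from config.models_config import (
    DEFAULT_BENCHMARK_MODEL,
    BENCHMARK_MODEL_ROLES,
)


def build_model_section(get_model_provider, add_log):
    # Resolve a provider for the single default benchmark model.
    provider = get_model_provider(DEFAULT_BENCHMARK_MODEL)
    if not provider:
        error_msg = (
            f"Required model not available: {DEFAULT_BENCHMARK_MODEL}. "
            "Cannot proceed with benchmark."
        )
        add_log(f"[ERROR] {error_msg}")
        raise RuntimeError(error_msg)

    # One entry in model_list, pointing at the default model and its provider.
    model_list = [{
        "model_name": DEFAULT_BENCHMARK_MODEL,
        "provider": provider,
        "api_key": "$HF_TOKEN",
        "max_concurrent_requests": 32,
    }]

    # model_roles now comes straight from the shared constant: ingestion,
    # summarization and both question-generation roles use the default model,
    # while chunking keeps its dedicated embedding model.
    return {
        "model_list": model_list,
        "model_roles": BENCHMARK_MODEL_ROLES,
    }
```

The pipeline section of the generated config (ingestion source directory and the rest) is assembled alongside these fields and is unchanged by this commit.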