Spaces:

yourbench
/

demo

Running on CPU Upgrade

sumuks HF Staff committed on Apr 2

Commit

afbd2d5

verified ·

1 Parent(s): da80f69

Add Llama 3.1 8B Instruct to the models to evaluate as a baseline (replaces google/gemma-3-27b-it in the list)

Files changed (1) hide show

backend/tasks/evaluation_task.py CHANGED Viewed

@@ -319,7 +319,7 @@ TASKS_TABLE = [yourbench]
         models = [
             "Qwen/QwQ-32B",
             "Qwen/Qwen2.5-72B-Instruct",
-            "google/gemma-3-27b-it",
             "meta-llama/Llama-3.3-70B-Instruct",
             "deepseek-ai/DeepSeek-R1-Distill-Llama-70B",
             "mistralai/Mistral-Small-24B-Instruct-2501",

         models = [
             "Qwen/QwQ-32B",
             "Qwen/Qwen2.5-72B-Instruct",
+            "meta-llama/Llama-3.1-8B-Instruct",
             "meta-llama/Llama-3.3-70B-Instruct",
             "deepseek-ai/DeepSeek-R1-Distill-Llama-70B",
             "mistralai/Mistral-Small-24B-Instruct-2501",