sumuks committed on
Commit
afbd2d5
·
verified ·
1 Parent(s): da80f69

Add meta-llama/Llama-3.1-8B-Instruct to the models to evaluate as a baseline (replaces google/gemma-3-27b-it)

Browse files
Files changed (1) hide show
  1. backend/tasks/evaluation_task.py +1 -1
backend/tasks/evaluation_task.py CHANGED
@@ -319,7 +319,7 @@ TASKS_TABLE = [yourbench]
319
  models = [
320
  "Qwen/QwQ-32B",
321
  "Qwen/Qwen2.5-72B-Instruct",
322
- "google/gemma-3-27b-it",
323
  "meta-llama/Llama-3.3-70B-Instruct",
324
  "deepseek-ai/DeepSeek-R1-Distill-Llama-70B",
325
  "mistralai/Mistral-Small-24B-Instruct-2501",
 
319
  models = [
320
  "Qwen/QwQ-32B",
321
  "Qwen/Qwen2.5-72B-Instruct",
322
+ "meta-llama/Llama-3.1-8B-Instruct",
323
  "meta-llama/Llama-3.3-70B-Instruct",
324
  "deepseek-ai/DeepSeek-R1-Distill-Llama-70B",
325
  "mistralai/Mistral-Small-24B-Instruct-2501",