daiqi committed on
Commit
f6375de
·
verified ·
1 Parent(s): 157969e

Update commit_results.jsonl

Browse files
Files changed (1) hide show
  1. commit_results.jsonl +0 -3
commit_results.jsonl CHANGED
@@ -177,6 +177,3 @@
177
  {"Score": 47.4, "Name": "MageBench", "BaseModel": "Random Baseline", "Env.": "Sokoban", "Target-research": "Model-Eval-Global", "Subset": "all", "Link": "xxx", "State": "Checked"}
178
  {"Score": 47.4, "Name": "MageBench", "BaseModel": "Random Baseline", "Env.": "Sokoban", "Target-research": "Model-Eval-Online", "Subset": "all", "Link": "xxx", "State": "Checked"}
179
  {"Score": 16.64, "Name": "MageBench", "BaseModel": "Random Baseline", "Env.": "Football", "Target-research": "Model-Eval-Online", "Subset": "all", "Link": "xxx", "State": "Checked"}
180
- {"Score": "3.22", "Name": "testing", "BaseModel": "testing", "Env": "Sokoban", "Target-research": "Model-Eval-Online", "Subset": "mini", "Link": "testing", "State": "Checking"}
181
- {"Score": "3.22", "Name": "testing", "BaseModel": "testing", "Env": "Football", "Target-research": "Agent-Eval-Prompt", "Subset": "all", "Link": "testing", "State": "Checking"}
182
- {"Score": "3.22", "Name": "testing", "BaseModel": "testing", "Env": "WebUI", "Target-research": "Agent-Eval-Finetune", "Subset": "all", "Link": "testing", "State": "Checking"}
 
177
  {"Score": 47.4, "Name": "MageBench", "BaseModel": "Random Baseline", "Env.": "Sokoban", "Target-research": "Model-Eval-Global", "Subset": "all", "Link": "xxx", "State": "Checked"}
178
  {"Score": 47.4, "Name": "MageBench", "BaseModel": "Random Baseline", "Env.": "Sokoban", "Target-research": "Model-Eval-Online", "Subset": "all", "Link": "xxx", "State": "Checked"}
179
  {"Score": 16.64, "Name": "MageBench", "BaseModel": "Random Baseline", "Env.": "Football", "Target-research": "Model-Eval-Online", "Subset": "all", "Link": "xxx", "State": "Checked"}