Spaces:

callanwu
/

WebWalkerQALeaderboard

Running

callanwu committed on 12 days ago

Commit

b96c1c5

1 Parent(s): 3cc52f3

update

Files changed (1) hide show

deepsearch_result.jsonl CHANGED Viewed

@@ -15,5 +15,5 @@
 {"org": "OPPO","link": "https://github.com/OPPO-PersonalAI/Agent_Foundation_Models","method": "AFM-SFT", "model": "qwen2.5-32b-instruct", "overall": 0.615}
 {"org": "OPPO","link": "https://github.com/OPPO-PersonalAI/Agent_Foundation_Models","method": "AFM-RL", "model": "qwen2.5-32b-instruct", "overall": 0.630}
 {"org": "OPPO","link": "https://github.com/OPPO-PersonalAI/Agent_Foundation_Models","method": "AFM-RL", "model": "qwen2.5-7b-instruct", "overall": 0.556}
-{"org": "Alibaba","link": "https://github.com/Alibaba-NLP/DeepResearch", "method": "AgentFounder", "model": " qwen3-30b-a3b", "overall": 0.719}
-{"org": "Alibaba","link": "https://github.com/Alibaba-NLP/DeepResearch", "method": "Tongyi DeepResearch", "model": " qwen3-30b-a3b", "overall": 0.72.2}

 {"org": "OPPO","link": "https://github.com/OPPO-PersonalAI/Agent_Foundation_Models","method": "AFM-SFT", "model": "qwen2.5-32b-instruct", "overall": 0.615}
 {"org": "OPPO","link": "https://github.com/OPPO-PersonalAI/Agent_Foundation_Models","method": "AFM-RL", "model": "qwen2.5-32b-instruct", "overall": 0.630}
 {"org": "OPPO","link": "https://github.com/OPPO-PersonalAI/Agent_Foundation_Models","method": "AFM-RL", "model": "qwen2.5-7b-instruct", "overall": 0.556}
+{"org": "Alibaba","link": "https://github.com/Alibaba-NLP/DeepResearch", "method": "AgentFounder", "model": "qwen3-30b-a3b", "overall": 0.719}
+{"org": "Alibaba","link": "https://github.com/Alibaba-NLP/DeepResearch", "method": "Tongyi DeepResearch", "model": "qwen3-30b-a3b", "overall": 0.722}