Spaces:
Running
Running
update
Browse files- deepsearch_result.jsonl +2 -2
deepsearch_result.jsonl
CHANGED
@@ -15,5 +15,5 @@
|
|
15 |
{"org": "OPPO","link": "https://github.com/OPPO-PersonalAI/Agent_Foundation_Models","method": "AFM-SFT", "model": "qwen2.5-32b-instruct", "overall": 0.615}
|
16 |
{"org": "OPPO","link": "https://github.com/OPPO-PersonalAI/Agent_Foundation_Models","method": "AFM-RL", "model": "qwen2.5-32b-instruct", "overall": 0.630}
|
17 |
{"org": "OPPO","link": "https://github.com/OPPO-PersonalAI/Agent_Foundation_Models","method": "AFM-RL", "model": "qwen2.5-7b-instruct", "overall": 0.556}
|
18 |
-
{"org": "Alibaba","link": "https://github.com/Alibaba-NLP/DeepResearch", "method": "AgentFounder", "model": "
|
19 |
-
{"org": "Alibaba","link": "https://github.com/Alibaba-NLP/DeepResearch", "method": "Tongyi DeepResearch", "model": "
|
|
|
15 |
{"org": "OPPO","link": "https://github.com/OPPO-PersonalAI/Agent_Foundation_Models","method": "AFM-SFT", "model": "qwen2.5-32b-instruct", "overall": 0.615}
|
16 |
{"org": "OPPO","link": "https://github.com/OPPO-PersonalAI/Agent_Foundation_Models","method": "AFM-RL", "model": "qwen2.5-32b-instruct", "overall": 0.630}
|
17 |
{"org": "OPPO","link": "https://github.com/OPPO-PersonalAI/Agent_Foundation_Models","method": "AFM-RL", "model": "qwen2.5-7b-instruct", "overall": 0.556}
|
18 |
+
{"org": "Alibaba","link": "https://github.com/Alibaba-NLP/DeepResearch", "method": "AgentFounder", "model": "qwen3-30b-a3b", "overall": 0.719}
|
19 |
+
{"org": "Alibaba","link": "https://github.com/Alibaba-NLP/DeepResearch", "method": "Tongyi DeepResearch", "model": "qwen3-30b-a3b", "overall": 0.722}
|