Update README.md
Browse files
README.md
CHANGED
@@ -11,6 +11,7 @@ tags:
|
|
11 |
- Calcium
|
12 |
- Opus
|
13 |
- 14B
|
|
|
14 |
model-index:
|
15 |
- name: Calcium-Opus-14B-Elite4
|
16 |
results:
|
@@ -28,7 +29,8 @@ model-index:
|
|
28 |
value: 61.12
|
29 |
name: averaged accuracy
|
30 |
source:
|
31 |
-
url:
|
|
|
32 |
name: Open LLM Leaderboard
|
33 |
- task:
|
34 |
type: text-generation
|
@@ -44,7 +46,8 @@ model-index:
|
|
44 |
value: 45.21
|
45 |
name: normalized accuracy
|
46 |
source:
|
47 |
-
url:
|
|
|
48 |
name: Open LLM Leaderboard
|
49 |
- task:
|
50 |
type: text-generation
|
@@ -60,7 +63,8 @@ model-index:
|
|
60 |
value: 23.04
|
61 |
name: exact match
|
62 |
source:
|
63 |
-
url:
|
|
|
64 |
name: Open LLM Leaderboard
|
65 |
- task:
|
66 |
type: text-generation
|
@@ -76,7 +80,8 @@ model-index:
|
|
76 |
value: 14.09
|
77 |
name: acc_norm
|
78 |
source:
|
79 |
-
url:
|
|
|
80 |
name: Open LLM Leaderboard
|
81 |
- task:
|
82 |
type: text-generation
|
@@ -91,7 +96,8 @@ model-index:
|
|
91 |
value: 17.69
|
92 |
name: acc_norm
|
93 |
source:
|
94 |
-
url:
|
|
|
95 |
name: Open LLM Leaderboard
|
96 |
- task:
|
97 |
type: text-generation
|
@@ -108,7 +114,8 @@ model-index:
|
|
108 |
value: 46.1
|
109 |
name: accuracy
|
110 |
source:
|
111 |
-
url:
|
|
|
112 |
name: Open LLM Leaderboard
|
113 |
---
|
114 |
|
@@ -212,5 +219,4 @@ Summarized results can be found [here](https://huggingface.co/datasets/open-llm-
|
|
212 |
|MATH Lvl 5 (4-Shot)| 23.04|
|
213 |
|GPQA (0-shot) | 14.09|
|
214 |
|MuSR (0-shot) | 17.69|
|
215 |
-
|MMLU-PRO (5-shot) | 46.10|
|
216 |
-
|
|
|
11 |
- Calcium
|
12 |
- Opus
|
13 |
- 14B
|
14 |
+
- qwq
|
15 |
model-index:
|
16 |
- name: Calcium-Opus-14B-Elite4
|
17 |
results:
|
|
|
29 |
value: 61.12
|
30 |
name: averaged accuracy
|
31 |
source:
|
32 |
+
url: >-
|
33 |
+
https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard#/?search=prithivMLmods%2FCalcium-Opus-14B-Elite4
|
34 |
name: Open LLM Leaderboard
|
35 |
- task:
|
36 |
type: text-generation
|
|
|
46 |
value: 45.21
|
47 |
name: normalized accuracy
|
48 |
source:
|
49 |
+
url: >-
|
50 |
+
https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard#/?search=prithivMLmods%2FCalcium-Opus-14B-Elite4
|
51 |
name: Open LLM Leaderboard
|
52 |
- task:
|
53 |
type: text-generation
|
|
|
63 |
value: 23.04
|
64 |
name: exact match
|
65 |
source:
|
66 |
+
url: >-
|
67 |
+
https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard#/?search=prithivMLmods%2FCalcium-Opus-14B-Elite4
|
68 |
name: Open LLM Leaderboard
|
69 |
- task:
|
70 |
type: text-generation
|
|
|
80 |
value: 14.09
|
81 |
name: acc_norm
|
82 |
source:
|
83 |
+
url: >-
|
84 |
+
https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard#/?search=prithivMLmods%2FCalcium-Opus-14B-Elite4
|
85 |
name: Open LLM Leaderboard
|
86 |
- task:
|
87 |
type: text-generation
|
|
|
96 |
value: 17.69
|
97 |
name: acc_norm
|
98 |
source:
|
99 |
+
url: >-
|
100 |
+
https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard#/?search=prithivMLmods%2FCalcium-Opus-14B-Elite4
|
101 |
name: Open LLM Leaderboard
|
102 |
- task:
|
103 |
type: text-generation
|
|
|
114 |
value: 46.1
|
115 |
name: accuracy
|
116 |
source:
|
117 |
+
url: >-
|
118 |
+
https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard#/?search=prithivMLmods%2FCalcium-Opus-14B-Elite4
|
119 |
name: Open LLM Leaderboard
|
120 |
---
|
121 |
|
|
|
219 |
|MATH Lvl 5 (4-Shot)| 23.04|
|
220 |
|GPQA (0-shot) | 14.09|
|
221 |
|MuSR (0-shot) | 17.69|
|
222 |
+
|MMLU-PRO (5-shot) | 46.10|
|
|