prithivMLmods committed on
Commit
8e0d080
·
verified ·
1 Parent(s): 6efc174

Update README.md

Browse files
Files changed (1) hide show
  1. README.md +14 -8
README.md CHANGED
@@ -11,6 +11,7 @@ tags:
11
  - Calcium
12
  - Opus
13
  - 14B
 
14
  model-index:
15
  - name: Calcium-Opus-14B-Elite4
16
  results:
@@ -28,7 +29,8 @@ model-index:
28
  value: 61.12
29
  name: averaged accuracy
30
  source:
31
- url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard#/?search=prithivMLmods%2FCalcium-Opus-14B-Elite4
 
32
  name: Open LLM Leaderboard
33
  - task:
34
  type: text-generation
@@ -44,7 +46,8 @@ model-index:
44
  value: 45.21
45
  name: normalized accuracy
46
  source:
47
- url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard#/?search=prithivMLmods%2FCalcium-Opus-14B-Elite4
 
48
  name: Open LLM Leaderboard
49
  - task:
50
  type: text-generation
@@ -60,7 +63,8 @@ model-index:
60
  value: 23.04
61
  name: exact match
62
  source:
63
- url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard#/?search=prithivMLmods%2FCalcium-Opus-14B-Elite4
 
64
  name: Open LLM Leaderboard
65
  - task:
66
  type: text-generation
@@ -76,7 +80,8 @@ model-index:
76
  value: 14.09
77
  name: acc_norm
78
  source:
79
- url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard#/?search=prithivMLmods%2FCalcium-Opus-14B-Elite4
 
80
  name: Open LLM Leaderboard
81
  - task:
82
  type: text-generation
@@ -91,7 +96,8 @@ model-index:
91
  value: 17.69
92
  name: acc_norm
93
  source:
94
- url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard#/?search=prithivMLmods%2FCalcium-Opus-14B-Elite4
 
95
  name: Open LLM Leaderboard
96
  - task:
97
  type: text-generation
@@ -108,7 +114,8 @@ model-index:
108
  value: 46.1
109
  name: accuracy
110
  source:
111
- url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard#/?search=prithivMLmods%2FCalcium-Opus-14B-Elite4
 
112
  name: Open LLM Leaderboard
113
  ---
114
 
@@ -212,5 +219,4 @@ Summarized results can be found [here](https://huggingface.co/datasets/open-llm-
212
  |MATH Lvl 5 (4-Shot)| 23.04|
213
  |GPQA (0-shot) | 14.09|
214
  |MuSR (0-shot) | 17.69|
215
- |MMLU-PRO (5-shot) | 46.10|
216
-
 
11
  - Calcium
12
  - Opus
13
  - 14B
14
+ - qwq
15
  model-index:
16
  - name: Calcium-Opus-14B-Elite4
17
  results:
 
29
  value: 61.12
30
  name: averaged accuracy
31
  source:
32
+ url: >-
33
+ https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard#/?search=prithivMLmods%2FCalcium-Opus-14B-Elite4
34
  name: Open LLM Leaderboard
35
  - task:
36
  type: text-generation
 
46
  value: 45.21
47
  name: normalized accuracy
48
  source:
49
+ url: >-
50
+ https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard#/?search=prithivMLmods%2FCalcium-Opus-14B-Elite4
51
  name: Open LLM Leaderboard
52
  - task:
53
  type: text-generation
 
63
  value: 23.04
64
  name: exact match
65
  source:
66
+ url: >-
67
+ https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard#/?search=prithivMLmods%2FCalcium-Opus-14B-Elite4
68
  name: Open LLM Leaderboard
69
  - task:
70
  type: text-generation
 
80
  value: 14.09
81
  name: acc_norm
82
  source:
83
+ url: >-
84
+ https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard#/?search=prithivMLmods%2FCalcium-Opus-14B-Elite4
85
  name: Open LLM Leaderboard
86
  - task:
87
  type: text-generation
 
96
  value: 17.69
97
  name: acc_norm
98
  source:
99
+ url: >-
100
+ https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard#/?search=prithivMLmods%2FCalcium-Opus-14B-Elite4
101
  name: Open LLM Leaderboard
102
  - task:
103
  type: text-generation
 
114
  value: 46.1
115
  name: accuracy
116
  source:
117
+ url: >-
118
+ https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard#/?search=prithivMLmods%2FCalcium-Opus-14B-Elite4
119
  name: Open LLM Leaderboard
120
  ---
121
 
 
219
  |MATH Lvl 5 (4-Shot)| 23.04|
220
  |GPQA (0-shot) | 14.09|
221
  |MuSR (0-shot) | 17.69|
222
+ |MMLU-PRO (5-shot) | 46.10|