Remove all extended
Browse filesThis view is limited to 50 files because it contains too many changes.
See raw diff
- eval_results/AI-MO/CodeLlama-34b-Python-hf-sft/aimo_v02.01/aimo_kaggle_tora_hard_extended/results_2024-06-16T08-24-28.663476.json +0 -9
- eval_results/AI-MO/CodeLlama-34b-Python-hf-sft/aimo_v02.01/aimo_kaggle_tora_hard_extended/results_2024-06-16T11-53-10.460117.json +0 -9
- eval_results/AI-MO/CodeLlama-34b-Python-hf-sft/aimo_v02.01/aimo_kaggle_tora_hard_extended/results_2024-06-16T11-53-43.320597.json +0 -9
- eval_results/AI-MO/CodeLlama-34b-Python-hf-sft/aimo_v02.01/aimo_kaggle_tora_hard_extended/results_2024-06-16T11-54-56.034580.json +0 -9
- eval_results/AI-MO/CodeLlama-34b-Python-hf-sft/aimo_v02.01/aimo_kaggle_tora_hard_extended/results_2024-06-16T12-02-03.876241.json +0 -9
- eval_results/AI-MO/CodeLlama-34b-Python-hf-sft/aimo_v02.01/aimo_kaggle_tora_hard_extended/results_2024-06-16T12-02-45.345868.json +0 -9
- eval_results/AI-MO/CodeLlama-34b-Python-hf-sft/aimo_v02.01/aimo_kaggle_tora_hard_extended/results_2024-06-16T12-10-05.892099.json +0 -9
- eval_results/AI-MO/CodeLlama-34b-Python-hf-sft/aimo_v02.01/aimo_kaggle_tora_hard_extended/results_2024-06-16T12-10-51.069893.json +0 -9
- eval_results/AI-MO/CodeLlama-34b-Python-hf-sft/aimo_v02.01/aimo_kaggle_tora_hard_extended/results_2024-06-16T12-11-09.142582.json +0 -9
- eval_results/AI-MO/CodeLlama-34b-Python-hf-sft/aimo_v02.01/aimo_kaggle_tora_hard_extended/results_2024-06-16T12-11-52.699054.json +0 -9
- eval_results/AI-MO/CodeLlama-34b-Python-hf-sft/aimo_v02.01/aimo_kaggle_tora_medium_extended/results_2024-06-16T07-52-17.741228.json +0 -9
- eval_results/AI-MO/CodeLlama-34b-Python-hf-sft/aimo_v02.01/aimo_kaggle_tora_medium_extended/results_2024-06-16T11-46-31.254392.json +0 -9
- eval_results/AI-MO/CodeLlama-34b-Python-hf-sft/aimo_v02.01/aimo_kaggle_tora_medium_extended/results_2024-06-16T11-47-22.155023.json +0 -9
- eval_results/AI-MO/CodeLlama-34b-Python-hf-sft/aimo_v02.01/aimo_kaggle_tora_medium_extended/results_2024-06-16T11-48-08.323537.json +0 -9
- eval_results/AI-MO/CodeLlama-34b-Python-hf-sft/aimo_v02.01/aimo_kaggle_tora_medium_extended/results_2024-06-16T11-49-19.457760.json +0 -9
- eval_results/AI-MO/CodeLlama-34b-Python-hf-sft/aimo_v02.01/aimo_kaggle_tora_medium_extended/results_2024-06-16T11-55-50.195477.json +0 -9
- eval_results/AI-MO/CodeLlama-34b-Python-hf-sft/aimo_v02.01/aimo_kaggle_tora_medium_extended/results_2024-06-16T11-56-37.842002.json +0 -9
- eval_results/AI-MO/CodeLlama-34b-Python-hf-sft/aimo_v02.01/aimo_kaggle_tora_medium_extended/results_2024-06-16T12-04-15.614023.json +0 -9
- eval_results/AI-MO/CodeLlama-34b-Python-hf-sft/aimo_v02.01/aimo_kaggle_tora_medium_extended/results_2024-06-16T12-05-03.205567.json +0 -9
- eval_results/AI-MO/CodeLlama-34b-Python-hf-sft/aimo_v02.01/aimo_kaggle_tora_medium_extended/results_2024-06-16T12-05-19.461439.json +0 -9
- eval_results/AI-MO/deepseek-coder-33b-sft/aimo_v05.16/aimo_kaggle_tora_hard_extended/results_2024-06-17T07-35-55.319691.json +0 -9
- eval_results/AI-MO/deepseek-coder-33b-sft/aimo_v05.16/aimo_kaggle_tora_hard_extended/results_2024-06-17T07-36-39.154099.json +0 -9
- eval_results/AI-MO/deepseek-coder-33b-sft/aimo_v05.16/aimo_kaggle_tora_hard_extended/results_2024-06-17T07-36-45.465309.json +0 -9
- eval_results/AI-MO/deepseek-coder-33b-sft/aimo_v05.16/aimo_kaggle_tora_hard_extended/results_2024-06-17T07-36-51.762138.json +0 -9
- eval_results/AI-MO/deepseek-coder-33b-sft/aimo_v05.16/aimo_kaggle_tora_hard_extended/results_2024-06-17T07-36-57.646782.json +0 -9
- eval_results/AI-MO/deepseek-coder-33b-sft/aimo_v05.16/aimo_kaggle_tora_hard_extended/results_2024-06-17T07-37-34.914869.json +0 -9
- eval_results/AI-MO/deepseek-coder-33b-sft/aimo_v05.16/aimo_kaggle_tora_medium_extended/results_2024-06-17T07-30-19.795635.json +0 -9
- eval_results/AI-MO/deepseek-coder-33b-sft/aimo_v05.16/aimo_kaggle_tora_medium_extended/results_2024-06-17T07-31-17.070563.json +0 -9
- eval_results/AI-MO/deepseek-coder-33b-sft/aimo_v05.16/aimo_kaggle_tora_medium_extended/results_2024-06-17T07-31-20.591558.json +0 -9
- eval_results/AI-MO/deepseek-coder-33b-sft/aimo_v05.16/aimo_kaggle_tora_medium_extended/results_2024-06-17T07-31-22.828801.json +0 -9
- eval_results/AI-MO/deepseek-coder-33b-sft/aimo_v05.16/aimo_kaggle_tora_medium_extended/results_2024-06-17T07-31-22.992274.json +0 -9
- eval_results/AI-MO/deepseek-coder-33b-sft/aimo_v05.16/aimo_kaggle_tora_medium_extended/results_2024-06-17T07-31-58.832163.json +0 -9
- eval_results/AI-MO/deepseek-coder-33b-sft/aimo_v05.16/aimo_kaggle_tora_medium_extended/results_2024-06-17T07-32-00.817395.json +0 -9
- eval_results/AI-MO/deepseek-coder-33b-sft/aimo_v05.16/aimo_kaggle_tora_medium_extended/results_2024-06-17T07-32-04.874285.json +0 -9
- eval_results/AI-MO/deepseek-coder-33b-sft/aimo_v05.20/aimo_kaggle_tora_hard_extended/results_2024-06-17T07-35-43.587013.json +0 -9
- eval_results/AI-MO/deepseek-coder-33b-sft/aimo_v05.20/aimo_kaggle_tora_hard_extended/results_2024-06-17T07-36-33.915430.json +0 -9
- eval_results/AI-MO/deepseek-coder-33b-sft/aimo_v05.20/aimo_kaggle_tora_hard_extended/results_2024-06-17T07-36-46.325504.json +0 -9
- eval_results/AI-MO/deepseek-coder-33b-sft/aimo_v05.20/aimo_kaggle_tora_hard_extended/results_2024-06-17T07-36-53.077942.json +0 -9
- eval_results/AI-MO/deepseek-coder-33b-sft/aimo_v05.20/aimo_kaggle_tora_hard_extended/results_2024-06-17T07-37-09.839521.json +0 -9
- eval_results/AI-MO/deepseek-coder-33b-sft/aimo_v05.20/aimo_kaggle_tora_hard_extended/results_2024-06-17T07-37-10.256361.json +0 -9
- eval_results/AI-MO/deepseek-coder-33b-sft/aimo_v05.20/aimo_kaggle_tora_hard_extended/results_2024-06-17T07-37-38.369986.json +0 -9
- eval_results/AI-MO/deepseek-coder-33b-sft/aimo_v05.20/aimo_kaggle_tora_medium_extended/results_2024-06-17T07-30-24.474723.json +0 -9
- eval_results/AI-MO/deepseek-coder-33b-sft/aimo_v05.20/aimo_kaggle_tora_medium_extended/results_2024-06-17T07-30-33.818723.json +0 -9
- eval_results/AI-MO/deepseek-coder-33b-sft/aimo_v05.20/aimo_kaggle_tora_medium_extended/results_2024-06-17T07-32-37.769119.json +0 -9
- eval_results/AI-MO/deepseek-coder-33b-sft/aimo_v05.20/aimo_kaggle_tora_medium_extended/results_2024-06-17T07-32-44.724632.json +0 -9
- eval_results/AI-MO/deepseek-coder-33b-sft/aimo_v05.20/aimo_kaggle_tora_medium_extended/results_2024-06-17T07-33-02.264328.json +0 -9
- eval_results/AI-MO/deepseek-math-7b-sft/aimo_v36.28.gptq-8bits/aimo_kaggle_tora_hard_extended/results_2024-06-16T14-57-18.666545.json +0 -9
- eval_results/AI-MO/deepseek-math-7b-sft/aimo_v36.28.gptq-8bits/aimo_kaggle_tora_hard_extended/results_2024-06-16T14-58-23.144488.json +0 -9
- eval_results/AI-MO/deepseek-math-7b-sft/aimo_v36.28.gptq-8bits/aimo_kaggle_tora_hard_extended/results_2024-06-16T14-58-25.920185.json +0 -9
- eval_results/AI-MO/deepseek-math-7b-sft/aimo_v36.28.gptq-8bits/aimo_kaggle_tora_hard_extended/results_2024-06-16T14-58-34.933827.json +0 -9
eval_results/AI-MO/CodeLlama-34b-Python-hf-sft/aimo_v02.01/aimo_kaggle_tora_hard_extended/results_2024-06-16T08-24-28.663476.json
DELETED
@@ -1,9 +0,0 @@
|
|
1 |
-
{
|
2 |
-
"model_name": "AI-MO/CodeLlama-34b-Python-hf-sft",
|
3 |
-
"model_revision": "aimo_v02.01",
|
4 |
-
"results": {
|
5 |
-
"aimo_kaggle_tora_hard_extended": {
|
6 |
-
"qem": 22.22222222222222
|
7 |
-
}
|
8 |
-
}
|
9 |
-
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
eval_results/AI-MO/CodeLlama-34b-Python-hf-sft/aimo_v02.01/aimo_kaggle_tora_hard_extended/results_2024-06-16T11-53-10.460117.json
DELETED
@@ -1,9 +0,0 @@
|
|
1 |
-
{
|
2 |
-
"model_name": "AI-MO/CodeLlama-34b-Python-hf-sft",
|
3 |
-
"model_revision": "aimo_v02.01",
|
4 |
-
"results": {
|
5 |
-
"aimo_kaggle_tora_hard_extended": {
|
6 |
-
"qem": 22.22222222222222
|
7 |
-
}
|
8 |
-
}
|
9 |
-
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
eval_results/AI-MO/CodeLlama-34b-Python-hf-sft/aimo_v02.01/aimo_kaggle_tora_hard_extended/results_2024-06-16T11-53-43.320597.json
DELETED
@@ -1,9 +0,0 @@
|
|
1 |
-
{
|
2 |
-
"model_name": "AI-MO/CodeLlama-34b-Python-hf-sft",
|
3 |
-
"model_revision": "aimo_v02.01",
|
4 |
-
"results": {
|
5 |
-
"aimo_kaggle_tora_hard_extended": {
|
6 |
-
"qem": 23.333333333333332
|
7 |
-
}
|
8 |
-
}
|
9 |
-
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
eval_results/AI-MO/CodeLlama-34b-Python-hf-sft/aimo_v02.01/aimo_kaggle_tora_hard_extended/results_2024-06-16T11-54-56.034580.json
DELETED
@@ -1,9 +0,0 @@
|
|
1 |
-
{
|
2 |
-
"model_name": "AI-MO/CodeLlama-34b-Python-hf-sft",
|
3 |
-
"model_revision": "aimo_v02.01",
|
4 |
-
"results": {
|
5 |
-
"aimo_kaggle_tora_hard_extended": {
|
6 |
-
"qem": 22.22222222222222
|
7 |
-
}
|
8 |
-
}
|
9 |
-
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
eval_results/AI-MO/CodeLlama-34b-Python-hf-sft/aimo_v02.01/aimo_kaggle_tora_hard_extended/results_2024-06-16T12-02-03.876241.json
DELETED
@@ -1,9 +0,0 @@
|
|
1 |
-
{
|
2 |
-
"model_name": "AI-MO/CodeLlama-34b-Python-hf-sft",
|
3 |
-
"model_revision": "aimo_v02.01",
|
4 |
-
"results": {
|
5 |
-
"aimo_kaggle_tora_hard_extended": {
|
6 |
-
"qem": 23.333333333333332
|
7 |
-
}
|
8 |
-
}
|
9 |
-
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
eval_results/AI-MO/CodeLlama-34b-Python-hf-sft/aimo_v02.01/aimo_kaggle_tora_hard_extended/results_2024-06-16T12-02-45.345868.json
DELETED
@@ -1,9 +0,0 @@
|
|
1 |
-
{
|
2 |
-
"model_name": "AI-MO/CodeLlama-34b-Python-hf-sft",
|
3 |
-
"model_revision": "aimo_v02.01",
|
4 |
-
"results": {
|
5 |
-
"aimo_kaggle_tora_hard_extended": {
|
6 |
-
"qem": 23.333333333333332
|
7 |
-
}
|
8 |
-
}
|
9 |
-
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
eval_results/AI-MO/CodeLlama-34b-Python-hf-sft/aimo_v02.01/aimo_kaggle_tora_hard_extended/results_2024-06-16T12-10-05.892099.json
DELETED
@@ -1,9 +0,0 @@
|
|
1 |
-
{
|
2 |
-
"model_name": "AI-MO/CodeLlama-34b-Python-hf-sft",
|
3 |
-
"model_revision": "aimo_v02.01",
|
4 |
-
"results": {
|
5 |
-
"aimo_kaggle_tora_hard_extended": {
|
6 |
-
"qem": 23.333333333333332
|
7 |
-
}
|
8 |
-
}
|
9 |
-
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
eval_results/AI-MO/CodeLlama-34b-Python-hf-sft/aimo_v02.01/aimo_kaggle_tora_hard_extended/results_2024-06-16T12-10-51.069893.json
DELETED
@@ -1,9 +0,0 @@
|
|
1 |
-
{
|
2 |
-
"model_name": "AI-MO/CodeLlama-34b-Python-hf-sft",
|
3 |
-
"model_revision": "aimo_v02.01",
|
4 |
-
"results": {
|
5 |
-
"aimo_kaggle_tora_hard_extended": {
|
6 |
-
"qem": 23.333333333333332
|
7 |
-
}
|
8 |
-
}
|
9 |
-
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
eval_results/AI-MO/CodeLlama-34b-Python-hf-sft/aimo_v02.01/aimo_kaggle_tora_hard_extended/results_2024-06-16T12-11-09.142582.json
DELETED
@@ -1,9 +0,0 @@
|
|
1 |
-
{
|
2 |
-
"model_name": "AI-MO/CodeLlama-34b-Python-hf-sft",
|
3 |
-
"model_revision": "aimo_v02.01",
|
4 |
-
"results": {
|
5 |
-
"aimo_kaggle_tora_hard_extended": {
|
6 |
-
"qem": 24.444444444444443
|
7 |
-
}
|
8 |
-
}
|
9 |
-
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
eval_results/AI-MO/CodeLlama-34b-Python-hf-sft/aimo_v02.01/aimo_kaggle_tora_hard_extended/results_2024-06-16T12-11-52.699054.json
DELETED
@@ -1,9 +0,0 @@
|
|
1 |
-
{
|
2 |
-
"model_name": "AI-MO/CodeLlama-34b-Python-hf-sft",
|
3 |
-
"model_revision": "aimo_v02.01",
|
4 |
-
"results": {
|
5 |
-
"aimo_kaggle_tora_hard_extended": {
|
6 |
-
"qem": 22.22222222222222
|
7 |
-
}
|
8 |
-
}
|
9 |
-
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
eval_results/AI-MO/CodeLlama-34b-Python-hf-sft/aimo_v02.01/aimo_kaggle_tora_medium_extended/results_2024-06-16T07-52-17.741228.json
DELETED
@@ -1,9 +0,0 @@
|
|
1 |
-
{
|
2 |
-
"model_name": "AI-MO/CodeLlama-34b-Python-hf-sft",
|
3 |
-
"model_revision": "aimo_v02.01",
|
4 |
-
"results": {
|
5 |
-
"aimo_kaggle_tora_medium_extended": {
|
6 |
-
"qem": 48.19277108433735
|
7 |
-
}
|
8 |
-
}
|
9 |
-
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
eval_results/AI-MO/CodeLlama-34b-Python-hf-sft/aimo_v02.01/aimo_kaggle_tora_medium_extended/results_2024-06-16T11-46-31.254392.json
DELETED
@@ -1,9 +0,0 @@
|
|
1 |
-
{
|
2 |
-
"model_name": "AI-MO/CodeLlama-34b-Python-hf-sft",
|
3 |
-
"model_revision": "aimo_v02.01",
|
4 |
-
"results": {
|
5 |
-
"aimo_kaggle_tora_medium_extended": {
|
6 |
-
"qem": 45.78313253012048
|
7 |
-
}
|
8 |
-
}
|
9 |
-
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
eval_results/AI-MO/CodeLlama-34b-Python-hf-sft/aimo_v02.01/aimo_kaggle_tora_medium_extended/results_2024-06-16T11-47-22.155023.json
DELETED
@@ -1,9 +0,0 @@
|
|
1 |
-
{
|
2 |
-
"model_name": "AI-MO/CodeLlama-34b-Python-hf-sft",
|
3 |
-
"model_revision": "aimo_v02.01",
|
4 |
-
"results": {
|
5 |
-
"aimo_kaggle_tora_medium_extended": {
|
6 |
-
"qem": 45.78313253012048
|
7 |
-
}
|
8 |
-
}
|
9 |
-
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
eval_results/AI-MO/CodeLlama-34b-Python-hf-sft/aimo_v02.01/aimo_kaggle_tora_medium_extended/results_2024-06-16T11-48-08.323537.json
DELETED
@@ -1,9 +0,0 @@
|
|
1 |
-
{
|
2 |
-
"model_name": "AI-MO/CodeLlama-34b-Python-hf-sft",
|
3 |
-
"model_revision": "aimo_v02.01",
|
4 |
-
"results": {
|
5 |
-
"aimo_kaggle_tora_medium_extended": {
|
6 |
-
"qem": 42.16867469879518
|
7 |
-
}
|
8 |
-
}
|
9 |
-
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
eval_results/AI-MO/CodeLlama-34b-Python-hf-sft/aimo_v02.01/aimo_kaggle_tora_medium_extended/results_2024-06-16T11-49-19.457760.json
DELETED
@@ -1,9 +0,0 @@
|
|
1 |
-
{
|
2 |
-
"model_name": "AI-MO/CodeLlama-34b-Python-hf-sft",
|
3 |
-
"model_revision": "aimo_v02.01",
|
4 |
-
"results": {
|
5 |
-
"aimo_kaggle_tora_medium_extended": {
|
6 |
-
"qem": 44.57831325301205
|
7 |
-
}
|
8 |
-
}
|
9 |
-
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
eval_results/AI-MO/CodeLlama-34b-Python-hf-sft/aimo_v02.01/aimo_kaggle_tora_medium_extended/results_2024-06-16T11-55-50.195477.json
DELETED
@@ -1,9 +0,0 @@
|
|
1 |
-
{
|
2 |
-
"model_name": "AI-MO/CodeLlama-34b-Python-hf-sft",
|
3 |
-
"model_revision": "aimo_v02.01",
|
4 |
-
"results": {
|
5 |
-
"aimo_kaggle_tora_medium_extended": {
|
6 |
-
"qem": 45.78313253012048
|
7 |
-
}
|
8 |
-
}
|
9 |
-
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
eval_results/AI-MO/CodeLlama-34b-Python-hf-sft/aimo_v02.01/aimo_kaggle_tora_medium_extended/results_2024-06-16T11-56-37.842002.json
DELETED
@@ -1,9 +0,0 @@
|
|
1 |
-
{
|
2 |
-
"model_name": "AI-MO/CodeLlama-34b-Python-hf-sft",
|
3 |
-
"model_revision": "aimo_v02.01",
|
4 |
-
"results": {
|
5 |
-
"aimo_kaggle_tora_medium_extended": {
|
6 |
-
"qem": 42.16867469879518
|
7 |
-
}
|
8 |
-
}
|
9 |
-
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
eval_results/AI-MO/CodeLlama-34b-Python-hf-sft/aimo_v02.01/aimo_kaggle_tora_medium_extended/results_2024-06-16T12-04-15.614023.json
DELETED
@@ -1,9 +0,0 @@
|
|
1 |
-
{
|
2 |
-
"model_name": "AI-MO/CodeLlama-34b-Python-hf-sft",
|
3 |
-
"model_revision": "aimo_v02.01",
|
4 |
-
"results": {
|
5 |
-
"aimo_kaggle_tora_medium_extended": {
|
6 |
-
"qem": 40.963855421686745
|
7 |
-
}
|
8 |
-
}
|
9 |
-
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
eval_results/AI-MO/CodeLlama-34b-Python-hf-sft/aimo_v02.01/aimo_kaggle_tora_medium_extended/results_2024-06-16T12-05-03.205567.json
DELETED
@@ -1,9 +0,0 @@
|
|
1 |
-
{
|
2 |
-
"model_name": "AI-MO/CodeLlama-34b-Python-hf-sft",
|
3 |
-
"model_revision": "aimo_v02.01",
|
4 |
-
"results": {
|
5 |
-
"aimo_kaggle_tora_medium_extended": {
|
6 |
-
"qem": 45.78313253012048
|
7 |
-
}
|
8 |
-
}
|
9 |
-
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
eval_results/AI-MO/CodeLlama-34b-Python-hf-sft/aimo_v02.01/aimo_kaggle_tora_medium_extended/results_2024-06-16T12-05-19.461439.json
DELETED
@@ -1,9 +0,0 @@
|
|
1 |
-
{
|
2 |
-
"model_name": "AI-MO/CodeLlama-34b-Python-hf-sft",
|
3 |
-
"model_revision": "aimo_v02.01",
|
4 |
-
"results": {
|
5 |
-
"aimo_kaggle_tora_medium_extended": {
|
6 |
-
"qem": 42.16867469879518
|
7 |
-
}
|
8 |
-
}
|
9 |
-
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
eval_results/AI-MO/deepseek-coder-33b-sft/aimo_v05.16/aimo_kaggle_tora_hard_extended/results_2024-06-17T07-35-55.319691.json
DELETED
@@ -1,9 +0,0 @@
|
|
1 |
-
{
|
2 |
-
"model_name": "AI-MO/deepseek-coder-33b-sft",
|
3 |
-
"model_revision": "aimo_v05.16",
|
4 |
-
"results": {
|
5 |
-
"aimo_kaggle_tora_hard_extended": {
|
6 |
-
"qem": 27.77777777777778
|
7 |
-
}
|
8 |
-
}
|
9 |
-
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
eval_results/AI-MO/deepseek-coder-33b-sft/aimo_v05.16/aimo_kaggle_tora_hard_extended/results_2024-06-17T07-36-39.154099.json
DELETED
@@ -1,9 +0,0 @@
|
|
1 |
-
{
|
2 |
-
"model_name": "AI-MO/deepseek-coder-33b-sft",
|
3 |
-
"model_revision": "aimo_v05.16",
|
4 |
-
"results": {
|
5 |
-
"aimo_kaggle_tora_hard_extended": {
|
6 |
-
"qem": 28.88888888888889
|
7 |
-
}
|
8 |
-
}
|
9 |
-
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
eval_results/AI-MO/deepseek-coder-33b-sft/aimo_v05.16/aimo_kaggle_tora_hard_extended/results_2024-06-17T07-36-45.465309.json
DELETED
@@ -1,9 +0,0 @@
|
|
1 |
-
{
|
2 |
-
"model_name": "AI-MO/deepseek-coder-33b-sft",
|
3 |
-
"model_revision": "aimo_v05.16",
|
4 |
-
"results": {
|
5 |
-
"aimo_kaggle_tora_hard_extended": {
|
6 |
-
"qem": 28.88888888888889
|
7 |
-
}
|
8 |
-
}
|
9 |
-
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
eval_results/AI-MO/deepseek-coder-33b-sft/aimo_v05.16/aimo_kaggle_tora_hard_extended/results_2024-06-17T07-36-51.762138.json
DELETED
@@ -1,9 +0,0 @@
|
|
1 |
-
{
|
2 |
-
"model_name": "AI-MO/deepseek-coder-33b-sft",
|
3 |
-
"model_revision": "aimo_v05.16",
|
4 |
-
"results": {
|
5 |
-
"aimo_kaggle_tora_hard_extended": {
|
6 |
-
"qem": 30.0
|
7 |
-
}
|
8 |
-
}
|
9 |
-
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
eval_results/AI-MO/deepseek-coder-33b-sft/aimo_v05.16/aimo_kaggle_tora_hard_extended/results_2024-06-17T07-36-57.646782.json
DELETED
@@ -1,9 +0,0 @@
|
|
1 |
-
{
|
2 |
-
"model_name": "AI-MO/deepseek-coder-33b-sft",
|
3 |
-
"model_revision": "aimo_v05.16",
|
4 |
-
"results": {
|
5 |
-
"aimo_kaggle_tora_hard_extended": {
|
6 |
-
"qem": 30.0
|
7 |
-
}
|
8 |
-
}
|
9 |
-
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
eval_results/AI-MO/deepseek-coder-33b-sft/aimo_v05.16/aimo_kaggle_tora_hard_extended/results_2024-06-17T07-37-34.914869.json
DELETED
@@ -1,9 +0,0 @@
|
|
1 |
-
{
|
2 |
-
"model_name": "AI-MO/deepseek-coder-33b-sft",
|
3 |
-
"model_revision": "aimo_v05.16",
|
4 |
-
"results": {
|
5 |
-
"aimo_kaggle_tora_hard_extended": {
|
6 |
-
"qem": 30.0
|
7 |
-
}
|
8 |
-
}
|
9 |
-
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
eval_results/AI-MO/deepseek-coder-33b-sft/aimo_v05.16/aimo_kaggle_tora_medium_extended/results_2024-06-17T07-30-19.795635.json
DELETED
@@ -1,9 +0,0 @@
|
|
1 |
-
{
|
2 |
-
"model_name": "AI-MO/deepseek-coder-33b-sft",
|
3 |
-
"model_revision": "aimo_v05.16",
|
4 |
-
"results": {
|
5 |
-
"aimo_kaggle_tora_medium_extended": {
|
6 |
-
"qem": 43.373493975903614
|
7 |
-
}
|
8 |
-
}
|
9 |
-
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
eval_results/AI-MO/deepseek-coder-33b-sft/aimo_v05.16/aimo_kaggle_tora_medium_extended/results_2024-06-17T07-31-17.070563.json
DELETED
@@ -1,9 +0,0 @@
|
|
1 |
-
{
|
2 |
-
"model_name": "AI-MO/deepseek-coder-33b-sft",
|
3 |
-
"model_revision": "aimo_v05.16",
|
4 |
-
"results": {
|
5 |
-
"aimo_kaggle_tora_medium_extended": {
|
6 |
-
"qem": 45.78313253012048
|
7 |
-
}
|
8 |
-
}
|
9 |
-
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
eval_results/AI-MO/deepseek-coder-33b-sft/aimo_v05.16/aimo_kaggle_tora_medium_extended/results_2024-06-17T07-31-20.591558.json
DELETED
@@ -1,9 +0,0 @@
|
|
1 |
-
{
|
2 |
-
"model_name": "AI-MO/deepseek-coder-33b-sft",
|
3 |
-
"model_revision": "aimo_v05.16",
|
4 |
-
"results": {
|
5 |
-
"aimo_kaggle_tora_medium_extended": {
|
6 |
-
"qem": 42.16867469879518
|
7 |
-
}
|
8 |
-
}
|
9 |
-
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
eval_results/AI-MO/deepseek-coder-33b-sft/aimo_v05.16/aimo_kaggle_tora_medium_extended/results_2024-06-17T07-31-22.828801.json
DELETED
@@ -1,9 +0,0 @@
|
|
1 |
-
{
|
2 |
-
"model_name": "AI-MO/deepseek-coder-33b-sft",
|
3 |
-
"model_revision": "aimo_v05.16",
|
4 |
-
"results": {
|
5 |
-
"aimo_kaggle_tora_medium_extended": {
|
6 |
-
"qem": 44.57831325301205
|
7 |
-
}
|
8 |
-
}
|
9 |
-
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
eval_results/AI-MO/deepseek-coder-33b-sft/aimo_v05.16/aimo_kaggle_tora_medium_extended/results_2024-06-17T07-31-22.992274.json
DELETED
@@ -1,9 +0,0 @@
|
|
1 |
-
{
|
2 |
-
"model_name": "AI-MO/deepseek-coder-33b-sft",
|
3 |
-
"model_revision": "aimo_v05.16",
|
4 |
-
"results": {
|
5 |
-
"aimo_kaggle_tora_medium_extended": {
|
6 |
-
"qem": 43.373493975903614
|
7 |
-
}
|
8 |
-
}
|
9 |
-
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
eval_results/AI-MO/deepseek-coder-33b-sft/aimo_v05.16/aimo_kaggle_tora_medium_extended/results_2024-06-17T07-31-58.832163.json
DELETED
@@ -1,9 +0,0 @@
|
|
1 |
-
{
|
2 |
-
"model_name": "AI-MO/deepseek-coder-33b-sft",
|
3 |
-
"model_revision": "aimo_v05.16",
|
4 |
-
"results": {
|
5 |
-
"aimo_kaggle_tora_medium_extended": {
|
6 |
-
"qem": 44.57831325301205
|
7 |
-
}
|
8 |
-
}
|
9 |
-
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
eval_results/AI-MO/deepseek-coder-33b-sft/aimo_v05.16/aimo_kaggle_tora_medium_extended/results_2024-06-17T07-32-00.817395.json
DELETED
@@ -1,9 +0,0 @@
|
|
1 |
-
{
|
2 |
-
"model_name": "AI-MO/deepseek-coder-33b-sft",
|
3 |
-
"model_revision": "aimo_v05.16",
|
4 |
-
"results": {
|
5 |
-
"aimo_kaggle_tora_medium_extended": {
|
6 |
-
"qem": 45.78313253012048
|
7 |
-
}
|
8 |
-
}
|
9 |
-
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
eval_results/AI-MO/deepseek-coder-33b-sft/aimo_v05.16/aimo_kaggle_tora_medium_extended/results_2024-06-17T07-32-04.874285.json
DELETED
@@ -1,9 +0,0 @@
|
|
1 |
-
{
|
2 |
-
"model_name": "AI-MO/deepseek-coder-33b-sft",
|
3 |
-
"model_revision": "aimo_v05.16",
|
4 |
-
"results": {
|
5 |
-
"aimo_kaggle_tora_medium_extended": {
|
6 |
-
"qem": 44.57831325301205
|
7 |
-
}
|
8 |
-
}
|
9 |
-
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
eval_results/AI-MO/deepseek-coder-33b-sft/aimo_v05.20/aimo_kaggle_tora_hard_extended/results_2024-06-17T07-35-43.587013.json
DELETED
@@ -1,9 +0,0 @@
|
|
1 |
-
{
|
2 |
-
"model_name": "AI-MO/deepseek-coder-33b-sft",
|
3 |
-
"model_revision": "aimo_v05.20",
|
4 |
-
"results": {
|
5 |
-
"aimo_kaggle_tora_hard_extended": {
|
6 |
-
"qem": 26.666666666666668
|
7 |
-
}
|
8 |
-
}
|
9 |
-
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
eval_results/AI-MO/deepseek-coder-33b-sft/aimo_v05.20/aimo_kaggle_tora_hard_extended/results_2024-06-17T07-36-33.915430.json
DELETED
@@ -1,9 +0,0 @@
|
|
1 |
-
{
|
2 |
-
"model_name": "AI-MO/deepseek-coder-33b-sft",
|
3 |
-
"model_revision": "aimo_v05.20",
|
4 |
-
"results": {
|
5 |
-
"aimo_kaggle_tora_hard_extended": {
|
6 |
-
"qem": 28.88888888888889
|
7 |
-
}
|
8 |
-
}
|
9 |
-
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
eval_results/AI-MO/deepseek-coder-33b-sft/aimo_v05.20/aimo_kaggle_tora_hard_extended/results_2024-06-17T07-36-46.325504.json
DELETED
@@ -1,9 +0,0 @@
|
|
1 |
-
{
|
2 |
-
"model_name": "AI-MO/deepseek-coder-33b-sft",
|
3 |
-
"model_revision": "aimo_v05.20",
|
4 |
-
"results": {
|
5 |
-
"aimo_kaggle_tora_hard_extended": {
|
6 |
-
"qem": 26.666666666666668
|
7 |
-
}
|
8 |
-
}
|
9 |
-
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
eval_results/AI-MO/deepseek-coder-33b-sft/aimo_v05.20/aimo_kaggle_tora_hard_extended/results_2024-06-17T07-36-53.077942.json
DELETED
@@ -1,9 +0,0 @@
|
|
1 |
-
{
|
2 |
-
"model_name": "AI-MO/deepseek-coder-33b-sft",
|
3 |
-
"model_revision": "aimo_v05.20",
|
4 |
-
"results": {
|
5 |
-
"aimo_kaggle_tora_hard_extended": {
|
6 |
-
"qem": 24.444444444444443
|
7 |
-
}
|
8 |
-
}
|
9 |
-
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
eval_results/AI-MO/deepseek-coder-33b-sft/aimo_v05.20/aimo_kaggle_tora_hard_extended/results_2024-06-17T07-37-09.839521.json
DELETED
@@ -1,9 +0,0 @@
|
|
1 |
-
{
|
2 |
-
"model_name": "AI-MO/deepseek-coder-33b-sft",
|
3 |
-
"model_revision": "aimo_v05.20",
|
4 |
-
"results": {
|
5 |
-
"aimo_kaggle_tora_hard_extended": {
|
6 |
-
"qem": 25.555555555555557
|
7 |
-
}
|
8 |
-
}
|
9 |
-
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
eval_results/AI-MO/deepseek-coder-33b-sft/aimo_v05.20/aimo_kaggle_tora_hard_extended/results_2024-06-17T07-37-10.256361.json
DELETED
@@ -1,9 +0,0 @@
|
|
1 |
-
{
|
2 |
-
"model_name": "AI-MO/deepseek-coder-33b-sft",
|
3 |
-
"model_revision": "aimo_v05.20",
|
4 |
-
"results": {
|
5 |
-
"aimo_kaggle_tora_hard_extended": {
|
6 |
-
"qem": 26.666666666666668
|
7 |
-
}
|
8 |
-
}
|
9 |
-
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
eval_results/AI-MO/deepseek-coder-33b-sft/aimo_v05.20/aimo_kaggle_tora_hard_extended/results_2024-06-17T07-37-38.369986.json
DELETED
@@ -1,9 +0,0 @@
|
|
1 |
-
{
|
2 |
-
"model_name": "AI-MO/deepseek-coder-33b-sft",
|
3 |
-
"model_revision": "aimo_v05.20",
|
4 |
-
"results": {
|
5 |
-
"aimo_kaggle_tora_hard_extended": {
|
6 |
-
"qem": 27.77777777777778
|
7 |
-
}
|
8 |
-
}
|
9 |
-
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
eval_results/AI-MO/deepseek-coder-33b-sft/aimo_v05.20/aimo_kaggle_tora_medium_extended/results_2024-06-17T07-30-24.474723.json
DELETED
@@ -1,9 +0,0 @@
|
|
1 |
-
{
|
2 |
-
"model_name": "AI-MO/deepseek-coder-33b-sft",
|
3 |
-
"model_revision": "aimo_v05.20",
|
4 |
-
"results": {
|
5 |
-
"aimo_kaggle_tora_medium_extended": {
|
6 |
-
"qem": 43.373493975903614
|
7 |
-
}
|
8 |
-
}
|
9 |
-
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
eval_results/AI-MO/deepseek-coder-33b-sft/aimo_v05.20/aimo_kaggle_tora_medium_extended/results_2024-06-17T07-30-33.818723.json
DELETED
@@ -1,9 +0,0 @@
|
|
1 |
-
{
|
2 |
-
"model_name": "AI-MO/deepseek-coder-33b-sft",
|
3 |
-
"model_revision": "aimo_v05.20",
|
4 |
-
"results": {
|
5 |
-
"aimo_kaggle_tora_medium_extended": {
|
6 |
-
"qem": 43.373493975903614
|
7 |
-
}
|
8 |
-
}
|
9 |
-
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
eval_results/AI-MO/deepseek-coder-33b-sft/aimo_v05.20/aimo_kaggle_tora_medium_extended/results_2024-06-17T07-32-37.769119.json
DELETED
@@ -1,9 +0,0 @@
|
|
1 |
-
{
|
2 |
-
"model_name": "AI-MO/deepseek-coder-33b-sft",
|
3 |
-
"model_revision": "aimo_v05.20",
|
4 |
-
"results": {
|
5 |
-
"aimo_kaggle_tora_medium_extended": {
|
6 |
-
"qem": 42.16867469879518
|
7 |
-
}
|
8 |
-
}
|
9 |
-
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
eval_results/AI-MO/deepseek-coder-33b-sft/aimo_v05.20/aimo_kaggle_tora_medium_extended/results_2024-06-17T07-32-44.724632.json
DELETED
@@ -1,9 +0,0 @@
|
|
1 |
-
{
|
2 |
-
"model_name": "AI-MO/deepseek-coder-33b-sft",
|
3 |
-
"model_revision": "aimo_v05.20",
|
4 |
-
"results": {
|
5 |
-
"aimo_kaggle_tora_medium_extended": {
|
6 |
-
"qem": 42.16867469879518
|
7 |
-
}
|
8 |
-
}
|
9 |
-
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
eval_results/AI-MO/deepseek-coder-33b-sft/aimo_v05.20/aimo_kaggle_tora_medium_extended/results_2024-06-17T07-33-02.264328.json
DELETED
@@ -1,9 +0,0 @@
|
|
1 |
-
{
|
2 |
-
"model_name": "AI-MO/deepseek-coder-33b-sft",
|
3 |
-
"model_revision": "aimo_v05.20",
|
4 |
-
"results": {
|
5 |
-
"aimo_kaggle_tora_medium_extended": {
|
6 |
-
"qem": 44.57831325301205
|
7 |
-
}
|
8 |
-
}
|
9 |
-
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
eval_results/AI-MO/deepseek-math-7b-sft/aimo_v36.28.gptq-8bits/aimo_kaggle_tora_hard_extended/results_2024-06-16T14-57-18.666545.json
DELETED
@@ -1,9 +0,0 @@
|
|
1 |
-
{
|
2 |
-
"model_name": "AI-MO/deepseek-math-7b-sft",
|
3 |
-
"model_revision": "aimo_v36.28.gptq-8bits",
|
4 |
-
"results": {
|
5 |
-
"aimo_kaggle_tora_hard_extended": {
|
6 |
-
"qem": 26.666666666666668
|
7 |
-
}
|
8 |
-
}
|
9 |
-
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
eval_results/AI-MO/deepseek-math-7b-sft/aimo_v36.28.gptq-8bits/aimo_kaggle_tora_hard_extended/results_2024-06-16T14-58-23.144488.json
DELETED
@@ -1,9 +0,0 @@
|
|
1 |
-
{
|
2 |
-
"model_name": "AI-MO/deepseek-math-7b-sft",
|
3 |
-
"model_revision": "aimo_v36.28.gptq-8bits",
|
4 |
-
"results": {
|
5 |
-
"aimo_kaggle_tora_hard_extended": {
|
6 |
-
"qem": 27.77777777777778
|
7 |
-
}
|
8 |
-
}
|
9 |
-
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
eval_results/AI-MO/deepseek-math-7b-sft/aimo_v36.28.gptq-8bits/aimo_kaggle_tora_hard_extended/results_2024-06-16T14-58-25.920185.json
DELETED
@@ -1,9 +0,0 @@
|
|
1 |
-
{
|
2 |
-
"model_name": "AI-MO/deepseek-math-7b-sft",
|
3 |
-
"model_revision": "aimo_v36.28.gptq-8bits",
|
4 |
-
"results": {
|
5 |
-
"aimo_kaggle_tora_hard_extended": {
|
6 |
-
"qem": 26.666666666666668
|
7 |
-
}
|
8 |
-
}
|
9 |
-
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
eval_results/AI-MO/deepseek-math-7b-sft/aimo_v36.28.gptq-8bits/aimo_kaggle_tora_hard_extended/results_2024-06-16T14-58-34.933827.json
DELETED
@@ -1,9 +0,0 @@
|
|
1 |
-
{
|
2 |
-
"model_name": "AI-MO/deepseek-math-7b-sft",
|
3 |
-
"model_revision": "aimo_v36.28.gptq-8bits",
|
4 |
-
"results": {
|
5 |
-
"aimo_kaggle_tora_hard_extended": {
|
6 |
-
"qem": 26.666666666666668
|
7 |
-
}
|
8 |
-
}
|
9 |
-
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|