asharsha30 committed on
Commit
8ce3503
·
verified ·
1 Parent(s): 80e318f

Update README.md

Browse files
Files changed (1) hide show
  1. README.md +114 -100
README.md CHANGED
@@ -1,102 +1,118 @@
1
  ---
2
  library_name: transformers
3
- tags: []
4
- # #model-index:
5
- # - name: LLAMA_Harsha_8_B_ORDP_10k
6
- # results:
7
- # - task:
8
- # type: text-generation
9
- # name: Text Generation
10
- # dataset:
11
- # name: IFEval (0-Shot)
12
- # type: HuggingFaceH4/ifeval
13
- # args:
14
- # num_few_shot: 0
15
- # metrics:
16
- # - type: inst_level_strict_acc and prompt_level_strict_acc
17
- # value: 34.64
18
- # name: strict accuracy
19
- # source:
20
- # url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=asharsha30/LLAMA_Harsha_8_B_ORDP_10k
21
- # name: Open LLM Leaderboard
22
- # - task:
23
- # type: text-generation
24
- # name: Text Generation
25
- # dataset:
26
- # name: BBH (3-Shot)
27
- # type: BBH
28
- # args:
29
- # num_few_shot: 3
30
- # metrics:
31
- # - type: acc_norm
32
- # value: 25.73
33
- # name: normalized accuracy
34
- # source:
35
- # url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=asharsha30/LLAMA_Harsha_8_B_ORDP_10k
36
- # name: Open LLM Leaderboard
37
- # - task:
38
- # type: text-generation
39
- # name: Text Generation
40
- # dataset:
41
- # name: MATH Lvl 5 (4-Shot)
42
- # type: hendrycks/competition_math
43
- # args:
44
- # num_few_shot: 4
45
- # metrics:
46
- # - type: exact_match
47
- # value: 5.21
48
- # name: exact match
49
- # source:
50
- # url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=asharsha30/LLAMA_Harsha_8_B_ORDP_10k
51
- # name: Open LLM Leaderboard
52
- # - task:
53
- # type: text-generation
54
- # name: Text Generation
55
- # dataset:
56
- # name: GPQA (0-shot)
57
- # type: Idavidrein/gpqa
58
- # args:
59
- # num_few_shot: 0
60
- # metrics:
61
- # - type: acc_norm
62
- # value: 3.13
63
- # name: acc_norm
64
- # source:
65
- # url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=asharsha30/LLAMA_Harsha_8_B_ORDP_10k
66
- # name: Open LLM Leaderboard
67
- # - task:
68
- # type: text-generation
69
- # name: Text Generation
70
- # dataset:
71
- # name: MuSR (0-shot)
72
- # type: TAUR-Lab/MuSR
73
- # args:
74
- # num_few_shot: 0
75
- # metrics:
76
- # - type: acc_norm
77
- # value: 7.07
78
- # name: acc_norm
79
- # source:
80
- # url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=asharsha30/LLAMA_Harsha_8_B_ORDP_10k
81
- # name: Open LLM Leaderboard
82
- # - task:
83
- # type: text-generation
84
- # name: Text Generation
85
- # dataset:
86
- # name: MMLU-PRO (5-shot)
87
- # type: TIGER-Lab/MMLU-Pro
88
- # config: main
89
- # split: test
90
- # args:
91
- # num_few_shot: 5
92
- # metrics:
93
- # - type: acc
94
- # value: 20.11
95
- # name: accuracy
96
- # source:
97
- # url: https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=asharsha30/LLAMA_Harsha_8_B_ORDP_10k
98
- # name: Open LLM Leaderboard
99
- # ---
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
100
 
101
  # Model Card for Model ID
102
 
@@ -373,6 +389,4 @@ Average: 37.96%
373
 
374
  Average score: 50.01%
375
 
376
- Elapsed time: 02:36:38
377
-
378
-
 
1
  ---
2
  library_name: transformers
3
+ tags:
4
+ - orpo
5
+ - llama3-8B
6
+ - Supervised_Training
7
+ model-index:
8
+ - name: LLAMA_Harsha_8_B_ORDP_10k
9
+ results:
10
+ - task:
11
+ type: text-generation
12
+ name: Text Generation
13
+ dataset:
14
+ name: IFEval (0-Shot)
15
+ type: HuggingFaceH4/ifeval
16
+ args:
17
+ num_few_shot: 0
18
+ metrics:
19
+ - type: inst_level_strict_acc and prompt_level_strict_acc
20
+ value: 34.64
21
+ name: strict accuracy
22
+ source:
23
+ url: >-
24
+ https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=asharsha30/LLAMA_Harsha_8_B_ORDP_10k
25
+ name: Open LLM Leaderboard
26
+ - task:
27
+ type: text-generation
28
+ name: Text Generation
29
+ dataset:
30
+ name: BBH (3-Shot)
31
+ type: BBH
32
+ args:
33
+ num_few_shot: 3
34
+ metrics:
35
+ - type: acc_norm
36
+ value: 25.73
37
+ name: normalized accuracy
38
+ source:
39
+ url: >-
40
+ https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=asharsha30/LLAMA_Harsha_8_B_ORDP_10k
41
+ name: Open LLM Leaderboard
42
+ - task:
43
+ type: text-generation
44
+ name: Text Generation
45
+ dataset:
46
+ name: MATH Lvl 5 (4-Shot)
47
+ type: hendrycks/competition_math
48
+ args:
49
+ num_few_shot: 4
50
+ metrics:
51
+ - type: exact_match
52
+ value: 5.21
53
+ name: exact match
54
+ source:
55
+ url: >-
56
+ https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=asharsha30/LLAMA_Harsha_8_B_ORDP_10k
57
+ name: Open LLM Leaderboard
58
+ - task:
59
+ type: text-generation
60
+ name: Text Generation
61
+ dataset:
62
+ name: GPQA (0-shot)
63
+ type: Idavidrein/gpqa
64
+ args:
65
+ num_few_shot: 0
66
+ metrics:
67
+ - type: acc_norm
68
+ value: 3.13
69
+ name: acc_norm
70
+ source:
71
+ url: >-
72
+ https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=asharsha30/LLAMA_Harsha_8_B_ORDP_10k
73
+ name: Open LLM Leaderboard
74
+ - task:
75
+ type: text-generation
76
+ name: Text Generation
77
+ dataset:
78
+ name: MuSR (0-shot)
79
+ type: TAUR-Lab/MuSR
80
+ args:
81
+ num_few_shot: 0
82
+ metrics:
83
+ - type: acc_norm
84
+ value: 7.07
85
+ name: acc_norm
86
+ source:
87
+ url: >-
88
+ https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=asharsha30/LLAMA_Harsha_8_B_ORDP_10k
89
+ name: Open LLM Leaderboard
90
+ - task:
91
+ type: text-generation
92
+ name: Text Generation
93
+ dataset:
94
+ name: MMLU-PRO (5-shot)
95
+ type: TIGER-Lab/MMLU-Pro
96
+ config: main
97
+ split: test
98
+ args:
99
+ num_few_shot: 5
100
+ metrics:
101
+ - type: acc
102
+ value: 20.11
103
+ name: accuracy
104
+ source:
105
+ url: >-
106
+ https://huggingface.co/spaces/open-llm-leaderboard/open_llm_leaderboard?query=asharsha30/LLAMA_Harsha_8_B_ORDP_10k
107
+ name: Open LLM Leaderboard
108
+ license: apache-2.0
109
+ datasets:
110
+ - mlabonne/orpo-dpo-mix-40k
111
+ language:
112
+ - en
113
+ base_model:
114
+ - meta-llama/Llama-3.1-8B
115
+ ---
116
 
117
  # Model Card for Model ID
118
 
 
389
 
390
  Average score: 50.01%
391
 
392
+ Elapsed time: 02:36:38