Update README.md
Browse files
README.md
CHANGED
@@ -24,4 +24,23 @@ hf (pretrained=Lambent/Falcon3-Continued-0.3-10B-Base), gen_kwargs: (None), limi
|
|
24 |
| | |none | 0|acc_norm|↑ |0.7954|± |0.0094|
|
25 |
|sciq | 1|none | 0|acc |↑ |0.9620|± |0.0060|
|
26 |
| | |none | 0|acc_norm|↑ |0.9500|± |0.0069|
|
27 |
-
|winogrande | 1|none | 0|acc |↑ |0.7332|± |0.0124|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
24 |
| | |none | 0|acc_norm|↑ |0.7954|± |0.0094|
|
25 |
|sciq | 1|none | 0|acc |↑ |0.9620|± |0.0060|
|
26 |
| | |none | 0|acc_norm|↑ |0.9500|± |0.0069|
|
27 |
+
|winogrande | 1|none | 0|acc |↑ |0.7332|± |0.0124|
|
28 |
+
|
29 |
+
Original base model (tiiuae/Falcon3-10B-Base) evaluated under the same conditions, for comparison:
|
30 |
+
|
31 |
+
hf (pretrained=tiiuae/Falcon3-10B-Base,dtype=auto,trust_remote_code=True), gen_kwargs: (None), limit: None, num_fewshot: 0, batch_size: auto
|
32 |
+
| Tasks |Version|Filter|n-shot| Metric | | Value | |Stderr|
|
33 |
+
|--------|------:|------|-----:|-----------------|---|-------:|---|-----:|
|
34 |
+
|eq_bench| 2.1|none | 0|eqbench |↑ | 60.9913|± |2.2402|
|
35 |
+
| | |none | 0|percent_parseable|↑ |100.0000|± |0.0000|
|
36 |
+
|
37 |
+
hf (pretrained=tiiuae/Falcon3-10B-Base), gen_kwargs: (None), limit: None, num_fewshot: None, batch_size: auto:4 (4,64,64,64)
|
38 |
+
| Tasks |Version|Filter|n-shot| Metric | |Value | |Stderr|
|
39 |
+
|-------------|------:|------|-----:|--------|---|-----:|---|-----:|
|
40 |
+
|arc_challenge| 1|none | 0|acc |↑ |0.5520|± |0.0145|
|
41 |
+
| | |none | 0|acc_norm|↑ |0.5887|± |0.0144|
|
42 |
+
|piqa | 1|none | 0|acc |↑ |0.7873|± |0.0095|
|
43 |
+
| | |none | 0|acc_norm|↑ |0.7949|± |0.0094|
|
44 |
+
|sciq | 1|none | 0|acc |↑ |0.9610|± |0.0061|
|
45 |
+
| | |none | 0|acc_norm|↑ |0.9360|± |0.0077|
|
46 |
+
|winogrande | 1|none | 0|acc |↑ |0.7364|± |0.0124|
|