Spaces:
Sleeping
Sleeping
Update mmlu_eval
Browse files
mmlu_eval
CHANGED
@@ -8,7 +8,7 @@ from transformers import AutoTokenizer, AutoModelForCausalLM
|
|
8 |
accuracy_metric = evaluate.load("accuracy")
|
9 |
|
10 |
# Load MMLU dataset
|
11 |
-
mmlu_dataset = load_dataset("
|
12 |
|
13 |
def generate_answer(model, tokenizer, question):
|
14 |
"""
|
|
|
8 |
accuracy_metric = evaluate.load("accuracy")
|
9 |
|
10 |
# Load MMLU dataset
|
11 |
+
mmlu_dataset = load_dataset("cais/mmlu", "all")
|
12 |
|
13 |
def generate_answer(model, tokenizer, question):
|
14 |
"""
|