Spaces:
Sleeping
Sleeping
Update mmlu_eval
Browse files
mmlu_eval
CHANGED
|
@@ -8,7 +8,7 @@ from transformers import AutoTokenizer, AutoModelForCausalLM
|
|
| 8 |
accuracy_metric = evaluate.load("accuracy")
|
| 9 |
|
| 10 |
# Load MMLU dataset
|
| 11 |
-
mmlu_dataset = load_dataset("
|
| 12 |
|
| 13 |
def generate_answer(model, tokenizer, question):
|
| 14 |
"""
|
|
|
|
| 8 |
accuracy_metric = evaluate.load("accuracy")
|
| 9 |
|
| 10 |
# Load MMLU dataset
|
| 11 |
+
mmlu_dataset = load_dataset("cais/mmlu", "all")
|
| 12 |
|
| 13 |
def generate_answer(model, tokenizer, question):
|
| 14 |
"""
|