Spaces:
Sleeping
Sleeping
Update app.py
Browse files
app.py
CHANGED
@@ -4,7 +4,7 @@ from transformers import AutoTokenizer, AutoModelForCausalLM
|
|
4 |
import os
|
5 |
from huggingface_hub import login
|
6 |
from toy_dataset_eval import evaluate_toy_dataset
|
7 |
-
from mmlu_eval_original import
|
8 |
import spaces
|
9 |
import pandas as pd
|
10 |
|
@@ -93,7 +93,8 @@ def run_mmlu_evaluation(all_subjects, num_subjects, num_shots, all_questions, nu
|
|
93 |
tokenizer,
|
94 |
num_subjects=num_subjects,
|
95 |
num_questions=num_questions,
|
96 |
-
num_shots=num_shots
|
|
|
97 |
)
|
98 |
|
99 |
# Format results
|
|
|
4 |
import os
|
5 |
from huggingface_hub import login
|
6 |
from toy_dataset_eval import evaluate_toy_dataset
|
7 |
+
from mmlu_eval_original import evaluate_mmlu_batched
|
8 |
import spaces
|
9 |
import pandas as pd
|
10 |
|
|
|
93 |
tokenizer,
|
94 |
num_subjects=num_subjects,
|
95 |
num_questions=num_questions,
|
96 |
+
num_shots=num_shots,
|
97 |
+
auto_batch_size=True
|
98 |
)
|
99 |
|
100 |
# Format results
|