Spaces:
Running
on
CPU Upgrade
Running
on
CPU Upgrade
fix generation bugs
Browse files
src/backend/run_eval_suite.py
CHANGED
@@ -32,8 +32,8 @@ def run_evaluation(eval_request: EvalRequest, task_names, num_fewshot, batch_siz
|
|
32 |
|
33 |
print(f"Selected Tasks: {task_names}")
|
34 |
print(f"Eval Request: {eval_request.get_model_args()}")
|
35 |
-
|
36 |
-
results = evaluator.simple_evaluate(model="hf-
|
37 |
model_args=eval_request.get_model_args(),
|
38 |
tasks=task_names,
|
39 |
num_fewshot=num_fewshot,
|
|
|
32 |
|
33 |
print(f"Selected Tasks: {task_names}")
|
34 |
print(f"Eval Request: {eval_request.get_model_args()}")
|
35 |
+
# hf-chat is implemented to use apply_chat_template
|
36 |
+
results = evaluator.simple_evaluate(model="hf-auto", # "hf-causal-experimental", # "hf-causal", hf-chat
|
37 |
model_args=eval_request.get_model_args(),
|
38 |
tasks=task_names,
|
39 |
num_fewshot=num_fewshot,
|