Spaces:

Weyaxi
/

leaderboard-results-to-modelcard

Running

Weyaxi committed on Jun 27

Commit

cb862a5

•

1 Parent(s): 1148fdd

metadata fixed

Files changed (1) hide show

functions.py CHANGED Viewed

@@ -41,7 +41,7 @@ def get_task_summary(results):
       "IFEval":
           {"dataset_type":"HuggingFaceH4/ifeval",
           "dataset_name":"IFEval (0-Shot)",
-          "metric_type":"inst_level_strict_acc",
           "metric_value":results["IFEval"],
           "dataset_config": None, # don't know
           "dataset_split": None, # don't know
@@ -84,10 +84,10 @@ def get_task_summary(results):
           "dataset_args":{"num_few_shot": 0},
           "metric_name":"acc_norm"
       },
-      "MUSR":
       {
           "dataset_type":"TAUR-Lab/MuSR",
-          "dataset_name":"Winogrande (5-shot)",
           "metric_type":"acc_norm",
           "metric_value":results["MUSR"],
           "dataset_config": None, # don't know

       "IFEval":
           {"dataset_type":"HuggingFaceH4/ifeval",
           "dataset_name":"IFEval (0-Shot)",
+          "metric_type": ["inst_level_strict_acc", "prompt_level_strict_acc"],
           "metric_value":results["IFEval"],
           "dataset_config": None, # don't know
           "dataset_split": None, # don't know
           "dataset_args":{"num_few_shot": 0},
           "metric_name":"acc_norm"
       },
+      "MuSR":
       {
           "dataset_type":"TAUR-Lab/MuSR",
+          "dataset_name":"MuSR (0-shot)",
           "metric_type":"acc_norm",
           "metric_value":results["MUSR"],
           "dataset_config": None, # don't know