# Spaces:
# Runtime error
# Runtime error
from dataclasses import dataclass
class Task:
    """Base description of an evaluation task.

    The subclasses in this file override these fields as plain class
    attributes. ``code``, ``name`` and ``metric`` are declared here without a
    value, so they only exist on subclasses that assign them.
    """

    # Identifier string of the task (e.g. "arc_vi").
    code: str
    # Name string of the task (e.g. "ARC-vi").
    name: str
    # Metric key for the task (e.g. "acc_norm", "ppl", "bleu").
    metric: str
    # Per the name: whether a larger metric value is the better result.
    higher_is_better: bool = True
    # Presumably the number of few-shot examples used -- confirm with the consumer.
    num_fewshot: int = 0
    # Presumably marks tasks whose test set is private -- confirm with the consumer.
    private_test: bool = False
class Lambada(Task):
    """Task settings for ``lambada_vi`` ("LAMBADA-vi")."""

    code = "lambada_vi"
    name = "LAMBADA-vi"
    metric = "ppl"  # presumably perplexity -- confirm
    higher_is_better = False  # the only task in this file where lower is better
    num_fewshot = 0
    private_test: bool = True
class Arc(Task):
    """Task settings for ``arc_vi`` ("ARC-vi")."""

    code = "arc_vi"
    name = "ARC-vi"
    metric = "acc_norm"
    higher_is_better = True
    num_fewshot = 25
    private_test: bool = False
class HellaSwag(Task):
    """Task settings for ``hellaswag_vi`` ("HellaSwag-vi")."""

    code = "hellaswag_vi"
    name = "HellaSwag-vi"
    metric = "acc_norm"
    higher_is_better = True
    num_fewshot = 10
    private_test: bool = False
class MMLU(Task):
    """Task settings for ``mmlu_vi`` ("MMLU-vi")."""

    code = "mmlu_vi"
    name = "MMLU-vi"
    metric = "acc_norm"
    higher_is_better = True
    num_fewshot = 5
    private_test: bool = False
class TruthfulQA(Task):
    """Task settings for ``truthfulqa_vi`` ("TruthfulQA-vi")."""

    code = "truthfulqa_vi"
    name = "TruthfulQA-vi"
    metric = "mc2"
    higher_is_better = True
    num_fewshot = 0
    private_test: bool = False
class Grade12Exams(Task):
    """Task settings for ``grade_12_exams_vi`` ("Grade 12 Exams").

    NOTE(review): this class is not listed in ``TASKS`` in this file --
    confirm whether that is intentional.
    """

    code = "grade_12_exams_vi"
    name = "Grade 12 Exams"
    metric = "acc_norm"
    higher_is_better = True
    num_fewshot = 5
    private_test: bool = False
class IWSLT2023_en_vi(Task):
    """Task settings for ``translation_vi`` ("IWSLT 2023 en-vi").

    NOTE(review): this class is not listed in ``TASKS`` in this file --
    confirm whether that is intentional.
    """

    code = "translation_vi"
    name = "IWSLT 2023 en-vi"
    metric = "bleu"
    higher_is_better = True
    num_fewshot = 0
    private_test: bool = False
class WikipediaQA(Task):
    """Task settings for ``wikipediaqa_vi``.

    The ``name`` string ("GeneralKnowledgeQA-vi") deliberately or otherwise
    differs from the class name and ``code``; it is kept exactly as found.
    """

    code = "wikipediaqa_vi"
    name = "GeneralKnowledgeQA-vi"
    metric = "acc_norm"
    higher_is_better = True
    num_fewshot = 5
    private_test: bool = True
class Comprehension(Task):
    """Task settings for ``comprehension_vi`` ("ComprehensionQA-vi")."""

    code = "comprehension_vi"
    name = "ComprehensionQA-vi"
    metric = "acc_norm"
    higher_is_better = True
    num_fewshot = 0
    private_test: bool = True
class Exams(Task):
    """Task settings for ``exams_vi`` ("Exams-vi")."""

    code = "exams_vi"
    name = "Exams-vi"
    metric = "acc_norm"
    higher_is_better = True
    num_fewshot = 5
    private_test: bool = True
# Task classes exposed by this module. The first list holds the classes with
# private_test = False, the second those with private_test = True.
# Grade12Exams and IWSLT2023_en_vi are defined in this file but not listed.
TASKS = [Arc, HellaSwag, MMLU, TruthfulQA] + [Lambada, WikipediaQA, Comprehension, Exams]