djstrong committed on
Commit
c6c119a
1 Parent(s): 1708479
Files changed (2) hide show
  1. src/about.py +3 -1
  2. src/display/utils.py +2 -1
src/about.py CHANGED
@@ -40,7 +40,9 @@ class Tasks(Enum):
40
  task25 = Task("polish_eq_bench_first_turn", "first_eqbench,none", "eq_bench_first_turn", "generate_until", 0.0)
41
  task26 = Task("polish_eq_bench", "average_eqbench,none", "eq_bench", "generate_until", 0.0)
42
  task20 = Task("polish_poleval2018_task3_test_10k", "word_perplexity,none", "poleval2018_task3_test_10k", "other")
43
- # task27 = Task("polish_eq_bench", "revised_eqbench,none", "eq_bench_revised", "other", 0.0)
 
 
44
 
45
 
46
  g_tasks = [task.value.benchmark for task in Tasks if task.value.type == "generate_until"]
 
40
  task25 = Task("polish_eq_bench_first_turn", "first_eqbench,none", "eq_bench_first_turn", "generate_until", 0.0)
41
  task26 = Task("polish_eq_bench", "average_eqbench,none", "eq_bench", "generate_until", 0.0)
42
  task20 = Task("polish_poleval2018_task3_test_10k", "word_perplexity,none", "poleval2018_task3_test_10k", "other")
43
+ task27 = Task("polish_poquad_reranking", "acc,none", "poquad_reranking", "other", 0.0)
44
+ task28 = Task("polish_abstractive_poquad_rag", "levenshtein,none", "abstractive_poquad_rag", "other", 0.0)
45
+ task29 = Task("polish_abstractive_poquad_open_book", "levenshtein,none", "abstractive_poquad_open_book", "other", 0.0)
46
 
47
 
48
  g_tasks = [task.value.benchmark for task in Tasks if task.value.type == "generate_until"]
src/display/utils.py CHANGED
@@ -37,7 +37,8 @@ auto_eval_column_dict.append(["average_mc", ColumnContent, ColumnContent("Avg mc
37
  auto_eval_column_dict.append(["average_rag", ColumnContent, ColumnContent("Avg RAG", "number", True)])
38
 
39
  for task in Tasks:
40
- auto_eval_column_dict.append([task.name, ColumnContent, ColumnContent(task.value.col_name, "number", True)])
 
41
  # Model information
42
 
43
  auto_eval_column_dict.append(["model_type", ColumnContent, ColumnContent("Type", "str", False)])
 
37
  auto_eval_column_dict.append(["average_rag", ColumnContent, ColumnContent("Avg RAG", "number", True)])
38
 
39
  for task in Tasks:
40
+ show = task.name not in ['polish_poquad_reranking','polish_abstractive_poquad_rag','polish_abstractive_poquad_open_book']
41
+ auto_eval_column_dict.append([task.name, ColumnContent, ColumnContent(task.value.col_name, "number", show)])
42
  # Model information
43
 
44
  auto_eval_column_dict.append(["model_type", ColumnContent, ColumnContent("Type", "str", False)])