djstrong committed on
Commit
d879a1e
1 Parent(s): fe596e9
Files changed (2) hide show
  1. src/about.py +1 -0
  2. src/display/utils.py +1 -1
src/about.py CHANGED
@@ -43,6 +43,7 @@ class Tasks(Enum):
43
  task27 = Task("polish_poquad_reranking", "acc,none", "poquad_reranking", "other", 0.0)
44
  task28 = Task("polish_abstractive_poquad_rag", "levenshtein,none", "abstractive_poquad_rag", "other", 0.0)
45
  task29 = Task("polish_abstractive_poquad_open_book", "levenshtein,none", "abstractive_poquad_open_book", "other", 0.0)
 
46
 
47
 
48
  g_tasks = [task.value.benchmark for task in Tasks if task.value.type == "generate_until"]
 
43
  task27 = Task("polish_poquad_reranking", "acc,none", "poquad_reranking", "other", 0.0)
44
  task28 = Task("polish_abstractive_poquad_rag", "levenshtein,none", "abstractive_poquad_rag", "other", 0.0)
45
  task29 = Task("polish_abstractive_poquad_open_book", "levenshtein,none", "abstractive_poquad_open_book", "other", 0.0)
46
+ task30 = Task("polish_pes_regex", "exact_match,score-first", "pes_g", "other", 0.2)
47
 
48
 
49
  g_tasks = [task.value.benchmark for task in Tasks if task.value.type == "generate_until"]
src/display/utils.py CHANGED
@@ -37,7 +37,7 @@ auto_eval_column_dict.append(["average_mc", ColumnContent, ColumnContent("Avg mc
37
  auto_eval_column_dict.append(["average_rag", ColumnContent, ColumnContent("Avg RAG", "number", True)])
38
 
39
  for task in Tasks:
40
- show = task.value.col_name not in ['poquad_reranking','abstractive_poquad_rag','abstractive_poquad_open_book']
41
  auto_eval_column_dict.append([task.name, ColumnContent, ColumnContent(task.value.col_name, "number", show)])
42
  # Model information
43
 
 
37
  auto_eval_column_dict.append(["average_rag", ColumnContent, ColumnContent("Avg RAG", "number", True)])
38
 
39
  for task in Tasks:
40
+ show = task.value.col_name not in ['poquad_reranking','abstractive_poquad_rag','abstractive_poquad_open_book', 'pes_g']
41
  auto_eval_column_dict.append([task.name, ColumnContent, ColumnContent(task.value.col_name, "number", show)])
42
  # Model information
43