zhuohan-7 commited on
Commit
ab58981
1 Parent(s): aa4435c

Upload folder using huggingface_hub

Browse files
Files changed (2) hide show
  1. app/draw_diagram.py +11 -22
  2. app/pages.py +8 -2
app/draw_diagram.py CHANGED
@@ -7,20 +7,8 @@ import pandas as pd
7
 
8
  from model_information import get_dataframe
9
 
10
-
11
  info_df = get_dataframe()
12
 
13
-
14
- # path = "./style/Leaderboard-Rename-SeaEval.csv"
15
- # info_df = pd.read_csv(path).dropna(axis=0)
16
-
17
- #Model2Detail = {
18
- # {'cross_mmlu': 'Cross-MMLU'}
19
- #}
20
-
21
-
22
-
23
-
24
  def draw(folder_name, category_one, category_two, sort, num_sort, model_size_range):
25
 
26
  folder = f"./results/{folder_name}/"
@@ -77,16 +65,17 @@ def draw(folder_name, category_one, category_two, sort, num_sort, model_size_ran
77
  max_value = round(max(chart_data.iloc[:, 1]) + 0.1*max(chart_data.iloc[:, 1]), 1)
78
 
79
  display_names = {
80
- 'cross_mmlu' : 'Cross-MMLU',
81
- 'cross_logiqa' : 'Cross-LogiQA',
82
- 'cross_xquad' : 'Cross-XQUAD',
83
- 'sg_eval' : 'SG EVAL',
84
- 'sg_eval_v1_cleaned': 'SG EVAL V1 Cleaned',
85
- 'sg_eval_v2_mcq' : 'SG EVAL V2 MCQ',
86
- 'sg_eval_v2_open' : 'SG EVAL V2 Open Ended',
87
- 'us_eval' : 'US EVAL',
88
- 'cn_eval' : 'CN EVAL',
89
- 'ph_eval' : 'PH EVAL'
 
90
  }
91
 
92
  data_columns = [i for i in chart_data.columns if i not in ['Model', 'model_show']]
 
7
 
8
  from model_information import get_dataframe
9
 
 
10
  info_df = get_dataframe()
11
 
 
 
 
 
 
 
 
 
 
 
 
12
  def draw(folder_name, category_one, category_two, sort, num_sort, model_size_range):
13
 
14
  folder = f"./results/{folder_name}/"
 
65
  max_value = round(max(chart_data.iloc[:, 1]) + 0.1*max(chart_data.iloc[:, 1]), 1)
66
 
67
  display_names = {
68
+ 'cross_mmlu' : 'Cross-MMLU',
69
+ 'cross_logiqa' : 'Cross-LogiQA',
70
+ 'cross_xquad' : 'Cross-XQUAD',
71
+ 'cross_mmlu_no_prompt': 'Cross-MMLU-No-Prompt',
72
+ 'sg_eval' : 'SG EVAL',
73
+ 'sg_eval_v1_cleaned' : 'SG EVAL V1 Cleaned',
74
+ 'sg_eval_v2_mcq' : 'SG EVAL V2 MCQ',
75
+ 'sg_eval_v2_open' : 'SG EVAL V2 Open Ended',
76
+ 'us_eval' : 'US EVAL',
77
+ 'cn_eval' : 'CN EVAL',
78
+ 'ph_eval' : 'PH EVAL'
79
  }
80
 
81
  data_columns = [i for i in chart_data.columns if i not in ['Model', 'model_show']]
app/pages.py CHANGED
@@ -76,7 +76,12 @@ def cross_lingual_consistency():
76
  st.title("Task: Cross-Lingual Consistency")
77
 
78
  filters_levelone = ['Zero Shot', 'Few Shot']
79
- filters_leveltwo = ['Cross-MMLU', 'Cross-XQUAD', 'Cross-LogiQA']
 
 
 
 
 
80
 
81
  category_one_dict = {
82
  'Zero Shot': 'zero_shot',
@@ -86,7 +91,8 @@ def cross_lingual_consistency():
86
  category_two_dict = {
87
  'Cross-MMLU' : 'cross_mmlu',
88
  'Cross-XQUAD' : 'cross_xquad',
89
- 'Cross-LogiQA': 'cross_logiqa'
 
90
  }
91
 
92
  left, center, middle, _, right = st.columns([0.2, 0.2, 0.2, 0.2 ,0.2])
 
76
  st.title("Task: Cross-Lingual Consistency")
77
 
78
  filters_levelone = ['Zero Shot', 'Few Shot']
79
+ filters_leveltwo = [
80
+ 'Cross-MMLU',
81
+ 'Cross-XQUAD',
82
+ 'Cross-LogiQA',
83
+ 'Cross-MMLU-No-Prompt',
84
+ ]
85
 
86
  category_one_dict = {
87
  'Zero Shot': 'zero_shot',
 
91
  category_two_dict = {
92
  'Cross-MMLU' : 'cross_mmlu',
93
  'Cross-XQUAD' : 'cross_xquad',
94
+ 'Cross-LogiQA': 'cross_logiqa',
95
+ 'Cross-MMLU-No-Prompt': 'cross_mmlu_no_prompt'
96
  }
97
 
98
  left, center, middle, _, right = st.columns([0.2, 0.2, 0.2, 0.2 ,0.2])