kevinpro committed on
Commit
4bdbb91
1 Parent(s): b220808
__pycache__/content.cpython-310.pyc ADDED
Binary file (1.66 kB). View file
 
__pycache__/css.cpython-310.pyc ADDED
Binary file (888 Bytes). View file
 
app.py CHANGED
@@ -79,34 +79,34 @@ MMLU_COL = "MMLU (25-shot)"
79
  TRUTHFULQA_COL = "TruthfulQA (0-shot)"
80
  NOTES_COL = "Notes" # For search only
81
 
82
- COLS = [MODEL_COL, LANG_COL, CODE_COL, AVERAGE_COL, ARC_COL, HELLASWAG_COL, MMLU_COL, TRUTHFULQA_COL, NOTES_COL]
83
- TYPES = ["str", "str", "str", "number", "number", "number", "number", "number", "str"]
84
 
85
 
86
 
87
  COLS = [MODEL_COL, MSVAMP_COL, MGSM_COL, MNUM_COL,NOTES_COL]
88
- TYPES = ["str", "number", "number", "number","str"]
89
 
90
 
91
 
92
  def get_leaderboard_df():
93
  df = list()
94
  results = [
95
- ["GPT-3.5-Turbo", 46.6, 42.2, 49.4],
96
- ["MAmmoTH 7B", 26.3, 21.3, 24.2],
97
- ["WizardMath 7B", 32.5, 23.0, 28.7],
98
- ["MetaMath 7B", 46.2, 37.0, 43.2],
99
- ["QAlign 7B", 57.2, 49.6, None],
100
- ["MathOctopus 7B", 41.2, 39.5, 37.1],
101
- ["MathOctopus-MAPO-DPO 7B(ours)🔥", 57.4, 41.6, 50.4],
102
- ["MetaMathOctopus 7B", 53.0, 45.5, 39.2],
103
- ["MetaMathOctopus-MAPO-DPO 7B(ours) 👑", 64.7, 51.6, 52.9],
104
- ["MistralMathOctopus 7B", 59.0, 58.0, 56.8],
105
- ["MistralMathOctopus-MAPO-DPO 7B(ours) 👑", 74.6, 67.3, 70.0]
 
 
106
  ]
107
 
108
- for i in results:
109
- i.append(i[0])
110
  df = pd.DataFrame.from_records(results, columns=COLS)
111
  df = df.sort_values(by=[ MSVAMP_COL], ascending=False)
112
  df = df[COLS]
@@ -116,18 +116,20 @@ def get_leaderboard_df():
116
  def get_leaderboard_13Bdf():
117
  df = list()
118
  results = [
119
- ["GPT-3.5-Turbo", 46.6, 42.2, 49.4],
120
- ["MAmmoTH 13B", 38.6, 28.9, 29.5],
121
- ["WizardMath 13B", 35.7, 28.3, 29.0],
122
- ["MetaMath 13B", 46.2, 43.9, 43.3],
123
- ["QAlign 13B", 62.6, 57.1, None],
124
- ["MathOctopus 13B", 51.8, 46.0, 40.3],
125
- ["MathOctopus-MAPO-DPO 13B (ours) 🔥", 60.1, 48.5, 53.8],
126
- ["MetaMathOctopus 13B", 56.3, 51.4, 49.5],
127
- ["MetaMathOctopus-MAPO-DPO 13B (ours) 👑", 67.0, 58.0, 59.8]
 
 
128
  ]
129
- for i in results:
130
- i.append(i[0])
131
  df = pd.DataFrame.from_records(results, columns=COLS)
132
  df = df.sort_values(by=[ MSVAMP_COL], ascending=False)
133
  df = df[COLS]
@@ -149,7 +151,7 @@ with demo:
149
  gr.Markdown(INTRO_TEXT, elem_classes="markdown-text")
150
  #gr.Markdown(HOW_TO, elem_classes="markdown-text")
151
 
152
- with gr.Box():
153
  search_bar = gr.Textbox(
154
  placeholder="Search models and languages...", show_label=False, elem_id="search-bar"
155
  )
@@ -158,13 +160,12 @@ with demo:
158
  value=original_df,
159
  headers=COLS,
160
  datatype=TYPES,
161
- max_rows=5,
162
  elem_id="leaderboard-table",
163
  )
164
 
165
  # # Dummy leaderboard for handling the case when the user uses backspace key
166
  hidden_leaderboard_table_for_search = gr.components.Dataframe(
167
- value=original_df, headers=COLS, datatype=TYPES, max_rows=5, visible=False
168
  )
169
 
170
  search_bar.change(
@@ -173,7 +174,7 @@ with demo:
173
  leaderboard_table,
174
  )
175
 
176
- with gr.Box():
177
  search_bar = gr.Textbox(
178
  placeholder="Search models and languages...", show_label=False, elem_id="search-bar"
179
  )
@@ -182,13 +183,12 @@ with demo:
182
  value=original_13Bdf,
183
  headers=COLS,
184
  datatype=TYPES,
185
- max_rows=5,
186
  elem_id="leaderboard-table",
187
  )
188
 
189
  # # Dummy leaderboard for handling the case when the user uses backspace key
190
  hidden_leaderboard_table_for_search_13B = gr.components.Dataframe(
191
- value=original_13Bdf, headers=COLS, datatype=TYPES, max_rows=5, visible=False
192
  )
193
 
194
  search_bar.change(
@@ -197,7 +197,6 @@ with demo:
197
  leaderboard_table_13B,
198
  )
199
 
200
- #gr.Markdown(CREDIT, elem_classes="markdown-text")
201
  gr.Markdown(CITATION, elem_classes="markdown-text")
202
 
203
  demo.launch()
 
79
  TRUTHFULQA_COL = "TruthfulQA (0-shot)"
80
  NOTES_COL = "Notes" # For search only
81
 
82
+ # COLS = [MODEL_COL, LANG_COL, CODE_COL, AVERAGE_COL, ARC_COL, HELLASWAG_COL, MMLU_COL, TRUTHFULQA_COL, NOTES_COL]
83
+ # TYPES = ["str", "str", "str", "number", "number", "number", "number", "number", "str"]
84
 
85
 
86
 
87
  COLS = [MODEL_COL, MSVAMP_COL, MGSM_COL, MNUM_COL,NOTES_COL]
88
+ TYPES = ["str", "number", "number", "number","html"]
89
 
90
 
91
 
92
  def get_leaderboard_df():
93
  df = list()
94
  results = [
95
+ ["GPT-3.5-Turbo", 46.6, 42.2, 49.4,'GPT-3.5-Turbo'],
96
+ ["MAmmoTH 7B", 26.3, 21.3, 24.2,'<a href="https://arxiv.org/abs/2309.05653" target="_blank">MAmmoTH</a>'],
97
+ ["WizardMath 7B", 32.5, 23.0, 28.7,'<a href="https://arxiv.org/abs/2308.09583" target="_blank">WizardMath</a>'],
98
+ ["MetaMath 7B", 46.2, 37.0, 43.2,'<a href="https://arxiv.org/abs/2309.12284" target="_blank">MetaMath</a>'],
99
+ ["MetaMath-LB-9B",None,50.2,None,'<a href="https://arxiv.org/abs/2401.10695" target="_blank">LangBridge</a>'],
100
+ ["XCoT 7B",42.9,41.5,None,'<a href="https://arxiv.org/abs/2401.07037" target="_blank">XCoT</a>'],
101
+ ["QAlign 7B", 57.2, 49.6, None,'<a href="https://arxiv.org/abs/2401.07817" target="_blank">QAlign</a>'],
102
+ ["MathOctopus 7B", 41.2, 39.5, 37.1,'<a href="https://arxiv.org/abs/2310.20246" target="_blank">MathOctopus</a>'],
103
+ ["MathOctopus-MAPO-DPO 7B", 57.4, 41.6, 50.4,'<a href="https://arxiv.org/abs/2401.06838" target="_blank">MAPO</a>'],
104
+ ["MetaMathOctopus 7B", 53.0, 45.5, 39.2,'<a href="https://arxiv.org/abs/2401.06838" target="_blank">MAPO</a>'],
105
+ ["MetaMathOctopus-MAPO-DPO 7B 👑", 64.7, 51.6, 52.9,'<a href="https://arxiv.org/abs/2401.06838" target="_blank">MAPO</a>'],
106
+ ["MistralMathOctopus 7B", 59.0, 58.0, 56.8,'<a href="https://arxiv.org/abs/2401.06838" target="_blank">MAPO</a>'],
107
+ ["MistralMathOctopus-MAPO-DPO 7B 👑", 74.6, 67.3, 70.0,'<a href="https://arxiv.org/abs/2401.06838" target="_blank">MAPO</a>'],
108
  ]
109
 
 
 
110
  df = pd.DataFrame.from_records(results, columns=COLS)
111
  df = df.sort_values(by=[ MSVAMP_COL], ascending=False)
112
  df = df[COLS]
 
116
  def get_leaderboard_13Bdf():
117
  df = list()
118
  results = [
119
+ ["GPT-3.5-Turbo", 46.6, 42.2, 49.4,'GPT-3.5-Turbo'],
120
+ ["MAmmoTH 13B", 38.6, 28.9, 29.5,'<a href="https://arxiv.org/abs/2309.05653" target="_blank">MAmmoTH</a>'],
121
+ ["WizardMath 13B", 35.7, 28.3, 29.0,'<a href="https://arxiv.org/abs/2308.09583" target="_blank">WizardMath</a>'],
122
+ ["MetaMath 13B", 46.2, 43.9, 43.3,'<a href="https://arxiv.org/abs/2309.12284" target="_blank">MetaMath</a>'],
123
+ ["QAlign 13B", 62.6, 57.1, None,'<a href="https://arxiv.org/abs/2401.07817" target="_blank">QAlign</a>'],
124
+ ["MathOctopus 13B", 51.8, 46.0, 40.3,'<a href="https://arxiv.org/abs/2310.20246" target="_blank">MathOctopus</a>'],
125
+ ["MetaMath-LB-15B",None,55.2,None,'<a href="https://arxiv.org/abs/2401.10695" target="_blank">LangBridge</a>'],
126
+ ["MetaMath-LB-20B",None,56.7,None,'<a href="https://arxiv.org/abs/2401.10695" target="_blank">LangBridge</a>'],
127
+ ["MathOctopus-MAPO-DPO 13B ", 60.1, 48.5, 53.8,'<a href="https://arxiv.org/abs/2401.06838" target="_blank">MAPO</a>'],
128
+ ["MetaMathOctopus 13B", 56.3, 51.4, 49.5,'<a href="https://arxiv.org/abs/2401.06838" target="_blank">MAPO</a>'],
129
+ ["MetaMathOctopus-MAPO-DPO 13B 👑", 67.0, 58.0, 59.8,'<a href="https://arxiv.org/abs/2401.06838" target="_blank">MAPO</a>'],
130
  ]
131
+ # for i in results:
132
+ # i.append(i[0])
133
  df = pd.DataFrame.from_records(results, columns=COLS)
134
  df = df.sort_values(by=[ MSVAMP_COL], ascending=False)
135
  df = df[COLS]
 
151
  gr.Markdown(INTRO_TEXT, elem_classes="markdown-text")
152
  #gr.Markdown(HOW_TO, elem_classes="markdown-text")
153
 
154
+ with gr.Group():
155
  search_bar = gr.Textbox(
156
  placeholder="Search models and languages...", show_label=False, elem_id="search-bar"
157
  )
 
160
  value=original_df,
161
  headers=COLS,
162
  datatype=TYPES,
 
163
  elem_id="leaderboard-table",
164
  )
165
 
166
  # # Dummy leaderboard for handling the case when the user uses backspace key
167
  hidden_leaderboard_table_for_search = gr.components.Dataframe(
168
+ value=original_df, headers=COLS, datatype=TYPES, visible=False
169
  )
170
 
171
  search_bar.change(
 
174
  leaderboard_table,
175
  )
176
 
177
+ with gr.Group():
178
  search_bar = gr.Textbox(
179
  placeholder="Search models and languages...", show_label=False, elem_id="search-bar"
180
  )
 
183
  value=original_13Bdf,
184
  headers=COLS,
185
  datatype=TYPES,
 
186
  elem_id="leaderboard-table",
187
  )
188
 
189
  # # Dummy leaderboard for handling the case when the user uses backspace key
190
  hidden_leaderboard_table_for_search_13B = gr.components.Dataframe(
191
+ value=original_13Bdf, headers=COLS, datatype=TYPES, visible=False
192
  )
193
 
194
  search_bar.change(
 
197
  leaderboard_table_13B,
198
  )
199
 
 
200
  gr.Markdown(CITATION, elem_classes="markdown-text")
201
 
202
  demo.launch()
css.py CHANGED
@@ -1,15 +1,27 @@
 
1
  CUSTOM_CSS = """
2
- /* Hides the final column */
3
- table td:last-child,
4
- table th:last-child {
5
- display: none;
6
- }
7
-
8
- /* 控制第一列的宽度 */
9
- table td:first-child,
10
- table th:first-child {
11
- max-width: 200px;
12
- overflow: auto;
13
- white-space: nowrap;
 
 
 
 
 
 
 
 
 
 
 
14
  }
15
  """
 
1
+ # css.py 文件
2
  CUSTOM_CSS = """
3
+ #leaderboard-table .dataframe th:nth-child(1),
4
+ #leaderboard-table .dataframe td:nth-child(1) {
5
+ width: 150px; /* Model column width */
6
+ }
7
+
8
+ #leaderboard-table .dataframe th:nth-child(2),
9
+ #leaderboard-table .dataframe td:nth-child(2) {
10
+ width: 100px; /* MSVAMP column width */
11
+ }
12
+
13
+ #leaderboard-table .dataframe th:nth-child(3),
14
+ #leaderboard-table .dataframe td:nth-child(3) {
15
+ width: 100px; /* MGSM column width */
16
+ }
17
+
18
+ #leaderboard-table .dataframe th:nth-child(4),
19
+ #leaderboard-table .dataframe td:nth-child(4) {
20
+ width: 100px; /* MNum column width */
21
+ }
22
+
23
+ #leaderboard-table .dataframe th:nth-child(5),
24
+ #leaderboard-table .dataframe td:nth-child(5) {
25
+ width: 200px; /* Notes column width */
26
  }
27
  """