Spaces:
Running
Running
update 20240525.csv
Browse files
- leaderboard.py +1 -1
- leaderboard_table_20240525.csv +1 -1
leaderboard.py
CHANGED
@@ -82,7 +82,6 @@ def build_leaderboard_tab(leaderboard_table_file):
|
|
82 |
gr.Markdown(make_default_md_2(), elem_id="leaderboard_markdown")
|
83 |
|
84 |
df = pd.read_csv(leaderboard_table_file)
|
85 |
-
|
86 |
def filter_leaderboard(dataset, timeout):
|
87 |
filtered_df = df[(df['Timeout'] == timeout) & (df['Dataset'] == dataset)]
|
88 |
return filtered_df.drop(columns=['Timeout', 'Dataset'])
|
@@ -109,3 +108,4 @@ def build_leaderboard_tab(leaderboard_table_file):
|
|
109 |
with gr.Accordion("Citation", open=True):
|
110 |
gr.Markdown(citation_md, elem_id="leaderboard_markdown")
|
111 |
gr.Markdown(acknowledgment_md, elem_id="ack_markdown")
|
|
|
|
82 |
gr.Markdown(make_default_md_2(), elem_id="leaderboard_markdown")
|
83 |
|
84 |
df = pd.read_csv(leaderboard_table_file)
|
|
|
85 |
def filter_leaderboard(dataset, timeout):
|
86 |
filtered_df = df[(df['Timeout'] == timeout) & (df['Dataset'] == dataset)]
|
87 |
return filtered_df.drop(columns=['Timeout', 'Dataset'])
|
|
|
108 |
with gr.Accordion("Citation", open=True):
|
109 |
gr.Markdown(citation_md, elem_id="leaderboard_markdown")
|
110 |
gr.Markdown(acknowledgment_md, elem_id="ack_markdown")
|
111 |
+
|
leaderboard_table_20240525.csv
CHANGED
@@ -1,4 +1,4 @@
|
|
1 |
-
model,
|
2 |
Artigenz-Coder-DS-6.7B,EffiBench,10,0.65,4.86,97.02,6.0,71.74,1.85,317.51,0.8,207.87,25.6,27332.76,6.3,38.2
|
3 |
claude-3-haiku_1,EffiBench,10,0.48,3.69,100.28,3.6,38.33,1.07,40.12,0.5,32.52,4.85,3524.68,3.8,44.3
|
4 |
claude-3-sonnet,EffiBench,10,0.7,5.19,100.31,5.7,73.52,1.97,539.82,0.4,248.98,33.08,48799.93,5.7,45.5
|
|
|
1 |
+
model,dataset,timeout,ET,NET,Max_NET,NET>5,MU,NMU,Max_NMU,NMU>5,TMU,NTMU,Max_TMU,TMU>5,pass1
|
2 |
Artigenz-Coder-DS-6.7B,EffiBench,10,0.65,4.86,97.02,6.0,71.74,1.85,317.51,0.8,207.87,25.6,27332.76,6.3,38.2
|
3 |
claude-3-haiku_1,EffiBench,10,0.48,3.69,100.28,3.6,38.33,1.07,40.12,0.5,32.52,4.85,3524.68,3.8,44.3
|
4 |
claude-3-sonnet,EffiBench,10,0.7,5.19,100.31,5.7,73.52,1.97,539.82,0.4,248.98,33.08,48799.93,5.7,45.5
|