Merge branch 'main' of https://huggingface.co/spaces/dingliyu/skillmix into main
Browse files
app.py
CHANGED
@@ -84,18 +84,22 @@ def load_all_results(path='final'):
|
|
84 |
|
85 |
block_css = """
|
86 |
#a {
|
|
|
87 |
background-color: #DEEBF7;
|
88 |
font-size: 20px;
|
89 |
}
|
90 |
#b {
|
|
|
91 |
background-color: #E2F0D9;
|
92 |
font-size: 20px;
|
93 |
}
|
94 |
#c {
|
|
|
95 |
background-color: #FFF2CC;
|
96 |
font-size: 20px;
|
97 |
}
|
98 |
#d {
|
|
|
99 |
background-color: #FBE5D6;
|
100 |
font-size: 20px;
|
101 |
}
|
@@ -273,13 +277,22 @@ def build_demo(df):
|
|
273 |
tracker = Tracker(df)
|
274 |
|
275 |
with gr.Blocks(
|
276 |
-
title="Skill
|
277 |
theme=gr.themes.Base(text_size=gr.themes.sizes.text_lg),
|
278 |
css=block_css,
|
279 |
) as demo:
|
280 |
gr.Markdown(
|
281 |
"""
|
282 |
-
# Skill
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
283 |
"""
|
284 |
)
|
285 |
|
@@ -418,6 +431,34 @@ def build_demo(df):
|
|
418 |
c.change(fn_list[0], input_list[0], output_list[0]).then(fn_list[1], input_list[1], output_list[1]).then(fn_list[2], input_list[2], output_list[2]).then(fn_list[3], input_list[3], output_list[3]).then(fn_list[4], input_list[4], output_list[4]).then(fn_list[5], input_list[5], output_list[5])
|
419 |
else:
|
420 |
raise NotImplementedError
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
421 |
return demo
|
422 |
|
423 |
|
|
|
84 |
|
85 |
block_css = """
|
86 |
#a {
|
87 |
+
color: black;
|
88 |
background-color: #DEEBF7;
|
89 |
font-size: 20px;
|
90 |
}
|
91 |
#b {
|
92 |
+
color: black;
|
93 |
background-color: #E2F0D9;
|
94 |
font-size: 20px;
|
95 |
}
|
96 |
#c {
|
97 |
+
color: black;
|
98 |
background-color: #FFF2CC;
|
99 |
font-size: 20px;
|
100 |
}
|
101 |
#d {
|
102 |
+
color: black;
|
103 |
background-color: #FBE5D6;
|
104 |
font-size: 20px;
|
105 |
}
|
|
|
277 |
tracker = Tracker(df)
|
278 |
|
279 |
with gr.Blocks(
|
280 |
+
title="Skill-Mix: a Flexible and Expandable Family of Evaluations for AI models",
|
281 |
theme=gr.themes.Base(text_size=gr.themes.sizes.text_lg),
|
282 |
css=block_css,
|
283 |
) as demo:
|
284 |
gr.Markdown(
|
285 |
"""
|
286 |
+
# Skill-Mix: a Flexible and Expandable Family of Evaluations for AI models
|
287 |
+
By [Princeton Language and Intelligence (PLI), Princeton University](https://pli.princeton.edu/) and [Google DeepMind](https://www.deepmind.com/)
|
288 |
+
|
289 |
+
### This is a demonstration of the Skill-Mix evaluation.
|
290 |
+
|
291 |
+
Paper link: [https://arxiv.org/abs/2310.17567](https://arxiv.org/abs/2310.17567)
|
292 |
+
|
293 |
+
### Samples are generated using 10% of the full set of skills and topics. Click the second tab for comparison between two generations.
|
294 |
+
|
295 |
+
Coming soon: generation by more models; grading by LLaMA-2.
|
296 |
"""
|
297 |
)
|
298 |
|
|
|
431 |
c.change(fn_list[0], input_list[0], output_list[0]).then(fn_list[1], input_list[1], output_list[1]).then(fn_list[2], input_list[2], output_list[2]).then(fn_list[3], input_list[3], output_list[3]).then(fn_list[4], input_list[4], output_list[4]).then(fn_list[5], input_list[5], output_list[5])
|
432 |
else:
|
433 |
raise NotImplementedError
|
434 |
+
gr.Markdown('''### Citations
|
435 |
+
```
|
436 |
+
@article{yu2023skillmix,
|
437 |
+
title={Skill-Mix: a Flexible and Expandable Family of Evaluations for AI models},
|
438 |
+
author={Yu, Dingli and Kaur, Simran and Gupta, Arushi and Brown-Cohen, Jonah and Goyal, Anirudh and Arora, Sanjeev},
|
439 |
+
journal={arXiv preprint arXiv:2310.17567},
|
440 |
+
year={2023}
|
441 |
+
}
|
442 |
+
```
|
443 |
+
```
|
444 |
+
@misc{openai2023gpt4,
|
445 |
+
title={GPT-4 Technical Report},
|
446 |
+
author={OpenAI},
|
447 |
+
year={2023},
|
448 |
+
eprint={2303.08774},
|
449 |
+
archivePrefix={arXiv},
|
450 |
+
primaryClass={cs.CL}
|
451 |
+
}
|
452 |
+
```
|
453 |
+
```
|
454 |
+
@article{touvron2023llama,
|
455 |
+
title={Llama 2: Open foundation and fine-tuned chat models},
|
456 |
+
author={Touvron, Hugo and Martin, Louis and Stone, Kevin and Albert, Peter and Almahairi, Amjad and Babaei, Yasmine and Bashlykov, Nikolay and Batra, Soumya and Bhargava, Prajjwal and Bhosale, Shruti and others},
|
457 |
+
journal={arXiv preprint arXiv:2307.09288},
|
458 |
+
year={2023}
|
459 |
+
}
|
460 |
+
```
|
461 |
+
''')
|
462 |
return demo
|
463 |
|
464 |
|