Spaces:

dingliyu
/

skillmix

Sleeping

App Files Community

Dingli Yu committed on Oct 27, 2023

Commit

b054c5c

•

2 Parent(s): 82ebbcd fbc7c46

Merge branch 'main' of https://huggingface.co/spaces/dingliyu/skillmix into main

Browse files

Files changed (1) hide show

app.py +43 -2

app.py CHANGED Viewed

@@ -84,18 +84,22 @@ def load_all_results(path='final'):
 block_css = """
 #a {
     background-color: #DEEBF7;
     font-size: 20px;
 }
 #b {
     background-color: #E2F0D9;
     font-size: 20px;
 }
 #c {
     background-color: #FFF2CC;
     font-size: 20px;
 }
 #d {
     background-color: #FBE5D6;
     font-size: 20px;
 }
@@ -273,13 +277,22 @@ def build_demo(df):
     tracker = Tracker(df)
     with gr.Blocks(
-        title="Skill Mix Browsing",
         theme=gr.themes.Base(text_size=gr.themes.sizes.text_lg),
         css=block_css,
     ) as demo:
         gr.Markdown(
             """
-# Skill Mix Browsing
 """
         )
@@ -418,6 +431,34 @@ def build_demo(df):
                     c.change(fn_list[0], input_list[0], output_list[0]).then(fn_list[1], input_list[1], output_list[1]).then(fn_list[2], input_list[2], output_list[2]).then(fn_list[3], input_list[3], output_list[3]).then(fn_list[4], input_list[4], output_list[4]).then(fn_list[5], input_list[5], output_list[5])
                 else:
                     raise NotImplementedError
     return demo

 block_css = """
 #a {
+    color: black;
     background-color: #DEEBF7;
     font-size: 20px;
 }
 #b {
+    color: black;
     background-color: #E2F0D9;
     font-size: 20px;
 }
 #c {
+    color: black;
     background-color: #FFF2CC;
     font-size: 20px;
 }
 #d {
+    color: black;
     background-color: #FBE5D6;
     font-size: 20px;
 }
     tracker = Tracker(df)
     with gr.Blocks(
+        title="Skill-Mix: a Flexible and Expandable Family of Evaluations for AI models",
         theme=gr.themes.Base(text_size=gr.themes.sizes.text_lg),
         css=block_css,
     ) as demo:
         gr.Markdown(
             """
+# Skill-Mix: a Flexible and Expandable Family of Evaluations for AI models
+By [Princeton Language and Intelligence (PLI), Princeton University](https://pli.princeton.edu/) and [Google DeepMind](https://www.deepmind.com/)
+### This is a demonstration of the Skill-Mix evaluation.
+Paper link: [https://arxiv.org/abs/2310.17567](https://arxiv.org/abs/2310.17567)
+### Samples are generated using 10% of the full set of skills and topics. Click the second tab for comparison between two generations.
+Coming soon: generation by more models; grading by LLaMA-2.
 """
         )
                     c.change(fn_list[0], input_list[0], output_list[0]).then(fn_list[1], input_list[1], output_list[1]).then(fn_list[2], input_list[2], output_list[2]).then(fn_list[3], input_list[3], output_list[3]).then(fn_list[4], input_list[4], output_list[4]).then(fn_list[5], input_list[5], output_list[5])
                 else:
                     raise NotImplementedError
+        gr.Markdown('''### Citations
+```
+@article{yu2023skillmix,
+      title={Skill-Mix: a Flexible and Expandable Family of Evaluations for AI models},
+      author={Yu, Dingli and Kaur, Simran and Gupta, Arushi and Brown-Cohen, Jonah and Goyal, Anirudh and Arora, Sanjeev},
+      journal={arXiv preprint arXiv:2310.17567},
+      year={2023}
+}
+```
+```
+@misc{openai2023gpt4,
+      title={GPT-4 Technical Report},
+      author={OpenAI},
+      year={2023},
+      eprint={2303.08774},
+      archivePrefix={arXiv},
+      primaryClass={cs.CL}
+}
+```
+```
+@article{touvron2023llama,
+  title={Llama 2: Open foundation and fine-tuned chat models},
+  author={Touvron, Hugo and Martin, Louis and Stone, Kevin and Albert, Peter and Almahairi, Amjad and Babaei, Yasmine and Bashlykov, Nikolay and Batra, Soumya and Bhargava, Prajjwal and Bhosale, Shruti and others},
+  journal={arXiv preprint arXiv:2307.09288},
+  year={2023}
+}
+```
+        ''')
     return demo