Dingli Yu committed on
Commit
b054c5c
2 Parent(s): 82ebbcd fbc7c46

Merge branch 'main' of https://huggingface.co/spaces/dingliyu/skillmix into main

Browse files
Files changed (1) hide show
  1. app.py +43 -2
app.py CHANGED
@@ -84,18 +84,22 @@ def load_all_results(path='final'):
84
 
85
  block_css = """
86
  #a {
 
87
  background-color: #DEEBF7;
88
  font-size: 20px;
89
  }
90
  #b {
 
91
  background-color: #E2F0D9;
92
  font-size: 20px;
93
  }
94
  #c {
 
95
  background-color: #FFF2CC;
96
  font-size: 20px;
97
  }
98
  #d {
 
99
  background-color: #FBE5D6;
100
  font-size: 20px;
101
  }
@@ -273,13 +277,22 @@ def build_demo(df):
273
  tracker = Tracker(df)
274
 
275
  with gr.Blocks(
276
- title="Skill Mix Browsing",
277
  theme=gr.themes.Base(text_size=gr.themes.sizes.text_lg),
278
  css=block_css,
279
  ) as demo:
280
  gr.Markdown(
281
  """
282
- # Skill Mix Browsing
 
 
 
 
 
 
 
 
 
283
  """
284
  )
285
 
@@ -418,6 +431,34 @@ def build_demo(df):
418
  c.change(fn_list[0], input_list[0], output_list[0]).then(fn_list[1], input_list[1], output_list[1]).then(fn_list[2], input_list[2], output_list[2]).then(fn_list[3], input_list[3], output_list[3]).then(fn_list[4], input_list[4], output_list[4]).then(fn_list[5], input_list[5], output_list[5])
419
  else:
420
  raise NotImplementedError
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
421
  return demo
422
 
423
 
 
84
 
85
  block_css = """
86
  #a {
87
+ color: black;
88
  background-color: #DEEBF7;
89
  font-size: 20px;
90
  }
91
  #b {
92
+ color: black;
93
  background-color: #E2F0D9;
94
  font-size: 20px;
95
  }
96
  #c {
97
+ color: black;
98
  background-color: #FFF2CC;
99
  font-size: 20px;
100
  }
101
  #d {
102
+ color: black;
103
  background-color: #FBE5D6;
104
  font-size: 20px;
105
  }
 
277
  tracker = Tracker(df)
278
 
279
  with gr.Blocks(
280
+ title="Skill-Mix: a Flexible and Expandable Family of Evaluations for AI models",
281
  theme=gr.themes.Base(text_size=gr.themes.sizes.text_lg),
282
  css=block_css,
283
  ) as demo:
284
  gr.Markdown(
285
  """
286
+ # Skill-Mix: a Flexible and Expandable Family of Evaluations for AI models
287
+ By [Princeton Language and Intelligence (PLI), Princeton University](https://pli.princeton.edu/) and [Google DeepMind](https://www.deepmind.com/)
288
+
289
+ ### This is a demonstration of the Skill-Mix evaluation.
290
+
291
+ Paper link: [https://arxiv.org/abs/2310.17567](https://arxiv.org/abs/2310.17567)
292
+
293
+ ### Samples are generated using 10% of the full set of skills and topics. Click the second tab for comparison between two generations.
294
+
295
+ Coming soon: generation by more models; grading by LLaMA-2.
296
  """
297
  )
298
 
 
431
  c.change(fn_list[0], input_list[0], output_list[0]).then(fn_list[1], input_list[1], output_list[1]).then(fn_list[2], input_list[2], output_list[2]).then(fn_list[3], input_list[3], output_list[3]).then(fn_list[4], input_list[4], output_list[4]).then(fn_list[5], input_list[5], output_list[5])
432
  else:
433
  raise NotImplementedError
434
+ gr.Markdown('''### Citations
435
+ ```
436
+ @article{yu2023skillmix,
437
+ title={Skill-Mix: a Flexible and Expandable Family of Evaluations for AI models},
438
+ author={Yu, Dingli and Kaur, Simran and Gupta, Arushi and Brown-Cohen, Jonah and Goyal, Anirudh and Arora, Sanjeev},
439
+ journal={arXiv preprint arXiv:2310.17567},
440
+ year={2023}
441
+ }
442
+ ```
443
+ ```
444
+ @misc{openai2023gpt4,
445
+ title={GPT-4 Technical Report},
446
+ author={OpenAI},
447
+ year={2023},
448
+ eprint={2303.08774},
449
+ archivePrefix={arXiv},
450
+ primaryClass={cs.CL}
451
+ }
452
+ ```
453
+ ```
454
+ @article{touvron2023llama,
455
+ title={Llama 2: Open foundation and fine-tuned chat models},
456
+ author={Touvron, Hugo and Martin, Louis and Stone, Kevin and Albert, Peter and Almahairi, Amjad and Babaei, Yasmine and Bashlykov, Nikolay and Batra, Soumya and Bhargava, Prajjwal and Bhosale, Shruti and others},
457
+ journal={arXiv preprint arXiv:2307.09288},
458
+ year={2023}
459
+ }
460
+ ```
461
+ ''')
462
  return demo
463
 
464