djstrong committed on
Commit
76bf962
1 Parent(s): 11c52b6

expand references further

Browse files
Files changed (1) hide show
  1. src/about.py +53 -3
src/about.py CHANGED
@@ -110,6 +110,7 @@ g_tasks = [task.value.benchmark for task in Tasks if task.value.type == "generat
110
  mc_tasks = [task.value.benchmark for task in Tasks if task.value.type == "multiple_choice"]
111
  rag_tasks = ['polish_polqa_reranking_multiple_choice', 'polish_polqa_open_book', 'polish_poquad_open_book']
112
  all_tasks = g_tasks + mc_tasks
 
113
 
114
  NUM_FEWSHOT = 0 # Change with your few shot
115
  # ---------------------------------------------------
@@ -245,12 +246,61 @@ If everything is done, check you can launch the EleutherAIHarness on your model
245
  """
246
 
247
  CITATION_BUTTON_LABEL = "Copy the following snippet to cite these results"
248
- CITATION_BUTTON_TEXT = r"""
249
- @misc{open-pl-llm-leaderboard,
250
  title = {Polish Medical Leaderboard},
251
  author = {Wróbel, Krzysztof and {SpeakLeash Team} and {Cyfronet Team}},
252
  year = 2024,
253
  publisher = {Hugging Face},
254
  howpublished = "\url{https://huggingface.co/spaces/speakleash/polish_medical_leaderboard}"
255
  }
256
- """
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
110
  mc_tasks = [task.value.benchmark for task in Tasks if task.value.type == "multiple_choice"]
111
  rag_tasks = ['polish_polqa_reranking_multiple_choice', 'polish_polqa_open_book', 'polish_poquad_open_book']
112
  all_tasks = g_tasks + mc_tasks
113
+ all_tasks.remove('polish_pes')
114
 
115
  NUM_FEWSHOT = 0 # Change with your few shot
116
  # ---------------------------------------------------
 
246
  """
247
 
248
  CITATION_BUTTON_LABEL = "Copy the following snippet to cite these results"
249
+ CITATION_BUTTON_TEXT = r"""@misc{polish-medical-llm-leaderboard,
 
250
  title = {Polish Medical Leaderboard},
251
  author = {Wróbel, Krzysztof and {SpeakLeash Team} and {Cyfronet Team}},
252
  year = 2024,
253
  publisher = {Hugging Face},
254
  howpublished = "\url{https://huggingface.co/spaces/speakleash/polish_medical_leaderboard}"
255
  }
256
+
257
+ @misc{eval-harness,
258
+ author = {Gao, Leo and Tow, Jonathan and Abbasi, Baber and Biderman, Stella and Black, Sid and DiPofi, Anthony and Foster, Charles and Golding, Laurence and Hsu, Jeffrey and Le Noac'h, Alain and Li, Haonan and McDonell, Kyle and Muennighoff, Niklas and Ociepa, Chris and Phang, Jason and Reynolds, Laria and Schoelkopf, Hailey and Skowron, Aviya and Sutawika, Lintang and Tang, Eric and Thite, Anish and Wang, Ben and Wang, Kevin and Zou, Andy},
259
+ title = {A framework for few-shot language model evaluation},
260
+ month = 07,
261
+ year = 2024,
262
+ publisher = {Zenodo},
263
+ version = {v0.4.3},
264
+ doi = {10.5281/zenodo.12608602},
265
+ url = {https://zenodo.org/records/12608602}
266
+ }
267
+
268
+ @misc{fwpes2024,
269
+ title={speakleash/PES-2018-2022},
270
+ author={Filipkowska, Maria and Wróbel, Krzysztof},
271
+ year={2024},
272
+ howpublished={\url{https://huggingface.co/datasets/speakleash/PES-2018-2022}},
273
+ }
274
+
275
+ @misc{pkgpes2024,
276
+ title={amu-cai/PES-2018-2022},
277
+ author={Jakub Pokrywka and Jeremi Kaczmarek and Edward Gorzelańczyk},
278
+ year={2024},
279
+ howpublished={\url{https://huggingface.co/datasets/amu-cai/PES-2018-2022}},
280
+ }
281
+
282
+ @misc{pokrywka2024gpt4,
283
+ title={GPT-4 passes most of the 297 written Polish Board Certification Examinations},
284
+ author={Jakub Pokrywka and Jeremi Kaczmarek and Edward Gorzelańczyk},
285
+ year={2024},
286
+ eprint={2405.01589},
287
+ archivePrefix={arXiv},
288
+ primaryClass={cs.CL}
289
+ }
290
+
291
+ @misc{open-pl-llm-leaderboard,
292
+ title = {Open PL LLM Leaderboard},
293
+ author = {Wróbel, Krzysztof and {SpeakLeash Team} and {Cyfronet Team}},
294
+ year = 2024,
295
+ publisher = {Hugging Face},
296
+ howpublished = "\url{https://huggingface.co/spaces/speakleash/open_pl_llm_leaderboard}"
297
+ }
298
+
299
+ @misc{open-llm-leaderboard-v1,
300
+ author = {Edward Beeching and Clémentine Fourrier and Nathan Habib and Sheon Han and Nathan Lambert and Nazneen Rajani and Omar Sanseviero and Lewis Tunstall and Thomas Wolf},
301
+ title = {Open LLM Leaderboard (2023-2024)},
302
+ year = {2023},
303
+ publisher = {Hugging Face},
304
+ howpublished = "\url{https://huggingface.co/spaces/open-llm-leaderboard-old/open_llm_leaderboard}"
305
+ }
306
+ """