diff --git a/.gitattributes b/.gitattributes index c7d9f3332a950355d5a77d85000f05e6f45435ea..0ed5bdcbdc79d57ce93731c9b9f401d17a23f69d 100644 --- a/.gitattributes +++ b/.gitattributes @@ -32,3 +32,160 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text *.zip filter=lfs diff=lfs merge=lfs -text *.zst filter=lfs diff=lfs merge=lfs -text *tfevents* filter=lfs diff=lfs merge=lfs -text +4b284b84b10c4py/evaluation/generation/examples.4b284b84b10c4py_GEM-wiki_lingua_en_tldr_en_1.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84b30c4py/evaluation/generation/examples.4b284b84b30c4py_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84b70c4py/evaluation/generation/examples.4b284b84b70c4py_GEM-web_nlg_en_PALM_prompt_3.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84b70c4py/evaluation/generation/examples.4b284b84b70c4py_gem_xsum_article_DOC_summary_4.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84b40c4py/evaluation/generation/examples.4b284b84b40c4py_gem_xsum_article_DOC_summary_0.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84b70c4py/evaluation/generation/examples.4b284b84b70c4py_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84b10c4py/evaluation/generation/examples.4b284b84b10c4py_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84b10c4py/evaluation/generation/examples.4b284b84b10c4py_GEM-web_nlg_en_PALM_prompt_1.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84b10c4py/evaluation/generation/examples.4b284b84b10c4py_gem_xsum_article_DOC_summary_0.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84b30c4py/evaluation/generation/examples.4b284b84b30c4py_GEM-wiki_lingua_en_tldr_en_4.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84b30c4py/evaluation/generation/examples.4b284b84b30c4py_gem_xsum_article_DOC_summary_0.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84b30c4py/evaluation/generation/examples.4b284b84b30c4py_GEM-wiki_lingua_en_tldr_en_5.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84b40c4py/evaluation/generation/examples.4b284b84b40c4py_GEM-wiki_lingua_en_tldr_en_1.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84b10c4py/evaluation/generation/examples.4b284b84b10c4py_GEM-wiki_lingua_en_tldr_en_2.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84b70c4py/evaluation/generation/examples.4b284b84b70c4py_GEM-wiki_lingua_en_tldr_en_4.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84b20c4py/evaluation/generation/examples.4b284b84b20c4py_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84b20c4py/evaluation/generation/examples.4b284b84b20c4py_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84b20c4py/evaluation/generation/examples.4b284b84b20c4py_GEM-web_nlg_en_PALM_prompt_4.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84b70c4py/evaluation/generation/examples.4b284b84b70c4py_GEM-wiki_lingua_en_tldr_en_5.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84b10c4py/evaluation/generation/examples.4b284b84b10c4py_GEM-wiki_lingua_en_tldr_en_5.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84b20c4py/evaluation/generation/examples.4b284b84b20c4py_gem_xsum_article_DOC_summary_3.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84b30c4py/evaluation/generation/examples.4b284b84b30c4py_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84b30c4py/evaluation/generation/examples.4b284b84b30c4py_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84b10c4py/evaluation/generation/examples.4b284b84b10c4py_GEM-wiki_lingua_en_tldr_en_4.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84b30c4py/evaluation/generation/examples.4b284b84b30c4py_GEM-web_nlg_en_PALM_prompt_1.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84b70c4py/evaluation/generation/examples.4b284b84b70c4py_GEM-wiki_lingua_en_tldr_en_2.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84b20c4py/evaluation/generation/examples.4b284b84b20c4py_GEM-wiki_lingua_en_tldr_en_0.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84b40c4py/evaluation/generation/examples.4b284b84b40c4py_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84b40c4py/evaluation/generation/examples.4b284b84b40c4py_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84b40c4py/evaluation/generation/examples.4b284b84b40c4py_GEM-web_nlg_en_PALM_prompt_3.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84b40c4py/evaluation/generation/examples.4b284b84b40c4py_GEM-web_nlg_en_PALM_prompt_2.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84b40c4py/evaluation/generation/examples.4b284b84b40c4py_gem_xsum_article_DOC_summary_1.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84b70c4py/evaluation/generation/examples.4b284b84b70c4py_GEM-web_nlg_en_PALM_prompt_1.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84b10c4py/evaluation/generation/examples.4b284b84b10c4py_gem_xsum_article_DOC_summary_1.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84b20c4py/evaluation/generation/examples.4b284b84b20c4py_GEM-web_nlg_en_PALM_prompt_0.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84b20c4py/evaluation/generation/examples.4b284b84b20c4py_GEM-wiki_lingua_en_tldr_en_3.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84b30c4py/evaluation/generation/examples.4b284b84b30c4py_GEM-wiki_lingua_en_tldr_en_2.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84b30c4py/evaluation/generation/examples.4b284b84b30c4py_gem_xsum_article_DOC_summary_1.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84b10c4py/evaluation/generation/examples.4b284b84b10c4py_GEM-web_nlg_en_PALM_prompt_5.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84b20c4py/evaluation/generation/examples.4b284b84b20c4py_GEM-web_nlg_en_PALM_prompt_3.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84b20c4py/evaluation/generation/examples.4b284b84b20c4py_gem_xsum_article_DOC_summary_2.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84b40c4py/evaluation/generation/examples.4b284b84b40c4py_GEM-wiki_lingua_en_tldr_en_0.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84b20c4py/evaluation/generation/examples.4b284b84b20c4py_GEM-web_nlg_en_PALM_prompt_2.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84b30c4py/evaluation/generation/examples.4b284b84b30c4py_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84b40c4py/evaluation/generation/examples.4b284b84b40c4py_GEM-web_nlg_en_PALM_prompt_0.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84b40c4py/evaluation/generation/examples.4b284b84b40c4py_GEM-wiki_lingua_en_tldr_en_3.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84b20c4py/evaluation/generation/examples.4b284b84b20c4py_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84b20c4py/evaluation/generation/examples.4b284b84b20c4py_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84b70c4py/evaluation/generation/examples.4b284b84b70c4py_gem_xsum_article_DOC_summary_1.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84b40c4py/evaluation/generation/examples.4b284b84b40c4py_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84b70c4py/evaluation/generation/examples.4b284b84b70c4py_gem_xsum_article_DOC_summary_0.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84b20c4py/evaluation/generation/examples.4b284b84b20c4py_gem_xsum_article_DOC_summary_5.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84b30c4py/evaluation/generation/examples.4b284b84b30c4py_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84b30c4py/evaluation/generation/examples.4b284b84b30c4py_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84b30c4py/evaluation/generation/examples.4b284b84b30c4py_GEM-web_nlg_en_PALM_prompt_5.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84b40c4py/evaluation/generation/examples.4b284b84b40c4py_GEM-web_nlg_en_PALM_prompt_4.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84b20c4py/evaluation/generation/examples.4b284b84b20c4py_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84b20c4py/evaluation/generation/examples.4b284b84b20c4py_GEM-wiki_lingua_en_tldr_en_1.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84b20c4py/evaluation/generation/examples.4b284b84b20c4py_gem_xsum_article_DOC_summary_4.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84b40c4py/evaluation/generation/examples.4b284b84b40c4py_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84b40c4py/evaluation/generation/examples.4b284b84b40c4py_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84b70c4py/evaluation/generation/examples.4b284b84b70c4py_GEM-web_nlg_en_PALM_prompt_5.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84b70c4py/evaluation/generation/examples.4b284b84b70c4py_GEM-wiki_lingua_en_tldr_en_3.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84b10c4py/evaluation/generation/examples.4b284b84b10c4py_gem_xsum_article_DOC_summary_5.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84b20c4py/evaluation/generation/examples.4b284b84b20c4py_GEM-web_nlg_en_PALM_prompt_1.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84b30c4py/evaluation/generation/examples.4b284b84b30c4py_gem_xsum_article_DOC_summary_5.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84b40c4py/evaluation/generation/examples.4b284b84b40c4py_gem_xsum_article_DOC_summary_5.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84b70c4py/evaluation/generation/examples.4b284b84b70c4py_GEM-web_nlg_en_PALM_prompt_0.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84b70c4py/evaluation/generation/examples.4b284b84b70c4py_GEM-wiki_lingua_en_tldr_en_0.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84b30c4py/evaluation/generation/examples.4b284b84b30c4py_GEM-wiki_lingua_en_tldr_en_3.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84b30c4py/evaluation/generation/examples.4b284b84b30c4py_gem_xsum_article_DOC_summary_4.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84b40c4py/evaluation/generation/examples.4b284b84b40c4py_gem_xsum_article_DOC_summary_4.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84b10c4py/evaluation/generation/examples.4b284b84b10c4py_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84b10c4py/evaluation/generation/examples.4b284b84b10c4py_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84b10c4py/evaluation/generation/examples.4b284b84b10c4py_gem_xsum_article_DOC_summary_4.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84b20c4py/evaluation/generation/examples.4b284b84b20c4py_GEM-wiki_lingua_en_tldr_en_2.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84b30c4py/evaluation/generation/examples.4b284b84b30c4py_GEM-web_nlg_en_PALM_prompt_0.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84b70c4py/evaluation/generation/examples.4b284b84b70c4py_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84b70c4py/evaluation/generation/examples.4b284b84b70c4py_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84b10c4py/evaluation/generation/examples.4b284b84b10c4py_GEM-web_nlg_en_PALM_prompt_4.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84b30c4py/evaluation/generation/examples.4b284b84b30c4py_GEM-wiki_lingua_en_tldr_en_0.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84b20c4py/evaluation/generation/examples.4b284b84b20c4py_GEM-wiki_lingua_en_tldr_en_5.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84b70c4py/evaluation/generation/examples.4b284b84b70c4py_GEM-web_nlg_en_PALM_prompt_4.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84b70c4py/evaluation/generation/examples.4b284b84b70c4py_gem_xsum_article_DOC_summary_3.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84b10c4py/evaluation/generation/examples.4b284b84b10c4py_gem_xsum_article_DOC_summary_2.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84b20c4py/evaluation/generation/examples.4b284b84b20c4py_GEM-wiki_lingua_en_tldr_en_4.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84b30c4py/evaluation/generation/examples.4b284b84b30c4py_gem_xsum_article_DOC_summary_2.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84b40c4py/evaluation/generation/examples.4b284b84b40c4py_gem_xsum_article_DOC_summary_2.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84b10c4py/evaluation/generation/examples.4b284b84b10c4py_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84b10c4py/evaluation/generation/examples.4b284b84b10c4py_GEM-wiki_lingua_en_tldr_en_0.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84b30c4py/evaluation/generation/examples.4b284b84b30c4py_GEM-web_nlg_en_PALM_prompt_4.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84b40c4py/evaluation/generation/examples.4b284b84b40c4py_GEM-web_nlg_en_PALM_prompt_5.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84b70c4py/evaluation/generation/examples.4b284b84b70c4py_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84b10c4py/evaluation/generation/examples.4b284b84b10c4py_GEM-web_nlg_en_PALM_prompt_0.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84b10c4py/evaluation/generation/examples.4b284b84b10c4py_GEM-wiki_lingua_en_tldr_en_3.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84b10c4py/evaluation/generation/examples.4b284b84b10c4py_GEM-web_nlg_en_PALM_prompt_3.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84b20c4py/evaluation/generation/examples.4b284b84b20c4py_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84b20c4py/evaluation/generation/examples.4b284b84b20c4py_GEM-web_nlg_en_PALM_prompt_5.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84b70c4py/evaluation/generation/examples.4b284b84b70c4py_GEM-wiki_lingua_en_tldr_en_1.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84b70c4py/evaluation/generation/examples.4b284b84b70c4py_gem_xsum_article_DOC_summary_2.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84b10c4py/evaluation/generation/examples.4b284b84b10c4py_GEM-web_nlg_en_PALM_prompt_2.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84b10c4py/evaluation/generation/examples.4b284b84b10c4py_gem_xsum_article_DOC_summary_3.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84b30c4py/evaluation/generation/examples.4b284b84b30c4py_gem_xsum_article_DOC_summary_3.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84b40c4py/evaluation/generation/examples.4b284b84b40c4py_gem_xsum_article_DOC_summary_3.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84b20c4py/evaluation/generation/examples.4b284b84b20c4py_gem_xsum_article_DOC_summary_1.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84b30c4py/evaluation/generation/examples.4b284b84b30c4py_GEM-wiki_lingua_en_tldr_en_1.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84b40c4py/evaluation/generation/examples.4b284b84b40c4py_GEM-wiki_lingua_en_tldr_en_5.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84b10c4py/evaluation/generation/examples.4b284b84b10c4py_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84b10c4py/evaluation/generation/examples.4b284b84b10c4py_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84b40c4py/evaluation/generation/examples.4b284b84b40c4py_GEM-wiki_lingua_en_tldr_en_4.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84b70c4py/evaluation/generation/examples.4b284b84b70c4py_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84b70c4py/evaluation/generation/examples.4b284b84b70c4py_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84b30c4py/evaluation/generation/examples.4b284b84b30c4py_GEM-web_nlg_en_PALM_prompt_2.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84b40c4py/evaluation/generation/examples.4b284b84b40c4py_GEM-wiki_lingua_en_tldr_en_2.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84b20c4py/evaluation/generation/examples.4b284b84b20c4py_gem_xsum_article_DOC_summary_0.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84b30c4py/evaluation/generation/examples.4b284b84b30c4py_GEM-web_nlg_en_PALM_prompt_3.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84b40c4py/evaluation/generation/examples.4b284b84b40c4py_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84b70c4py/evaluation/generation/examples.4b284b84b70c4py_gem_xsum_article_DOC_summary_5.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84b40c4py/evaluation/generation/examples.4b284b84b40c4py_GEM-web_nlg_en_PALM_prompt_1.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84b70c4py/evaluation/generation/examples.4b284b84b70c4py_GEM-web_nlg_en_PALM_prompt_2.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84b10c4py/transformers/tokenizer.json filter=lfs diff=lfs merge=lfs -text +4b284b84b20c4py/transformers/tokenizer.json filter=lfs diff=lfs merge=lfs -text +4b284b84b30c4py/transformers/tokenizer.json filter=lfs diff=lfs merge=lfs -text +4b284b84b40c4py/transformers/tokenizer.json filter=lfs diff=lfs merge=lfs -text +4b284b84b60c4py/transformers/tokenizer.json filter=lfs diff=lfs merge=lfs -text +4b284b84b70c4py/transformers/tokenizer.json filter=lfs diff=lfs merge=lfs -text +4b284b84b20c4py/transformers/vocab.json filter=lfs diff=lfs merge=lfs -text +4b284b84b30c4py/transformers/vocab.json filter=lfs diff=lfs merge=lfs -text +4b284b84b40c4py/transformers/vocab.json filter=lfs diff=lfs merge=lfs -text +4b284b84b60c4py/transformers/vocab.json filter=lfs diff=lfs merge=lfs -text +4b284b84b70c4py/transformers/vocab.json filter=lfs diff=lfs merge=lfs -text +4b284b84b10c4py/transformers/vocab.json filter=lfs diff=lfs merge=lfs -text +4b284b84b60c4py/evaluation/generation/examples.4b284b84b60c4py_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84b60c4py/evaluation/generation/examples.4b284b84b60c4py_GEM-web_nlg_en_PALM_prompt_5.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84b60c4py/evaluation/generation/examples.4b284b84b60c4py_GEM-wiki_lingua_en_tldr_en_0.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84b60c4py/evaluation/generation/examples.4b284b84b60c4py_gem_xsum_article_DOC_summary_0.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84b60c4py/evaluation/generation/examples.4b284b84b60c4py_gem_xsum_article_DOC_summary_3.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84b60c4py/evaluation/generation/examples.4b284b84b60c4py_GEM-wiki_lingua_en_tldr_en_2.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84b60c4py/evaluation/generation/examples.4b284b84b60c4py_GEM-wiki_lingua_en_tldr_en_3.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84b60c4py/evaluation/generation/examples.4b284b84b60c4py_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84b60c4py/evaluation/generation/examples.4b284b84b60c4py_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84b60c4py/evaluation/generation/examples.4b284b84b60c4py_GEM-web_nlg_en_PALM_prompt_0.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84b60c4py/evaluation/generation/examples.4b284b84b60c4py_GEM-web_nlg_en_PALM_prompt_1.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84b60c4py/evaluation/generation/examples.4b284b84b60c4py_GEM-web_nlg_en_PALM_prompt_2.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84b60c4py/evaluation/generation/examples.4b284b84b60c4py_GEM-wiki_lingua_en_tldr_en_1.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84b60c4py/evaluation/generation/examples.4b284b84b60c4py_gem_xsum_article_DOC_summary_2.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84b60c4py/evaluation/generation/examples.4b284b84b60c4py_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84b60c4py/evaluation/generation/examples.4b284b84b60c4py_GEM-web_nlg_en_PALM_prompt_4.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84b60c4py/evaluation/generation/examples.4b284b84b60c4py_gem_xsum_article_DOC_summary_5.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84b60c4py/evaluation/generation/examples.4b284b84b60c4py_gem_xsum_article_DOC_summary_4.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84b60c4py/evaluation/generation/examples.4b284b84b60c4py_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84b60c4py/evaluation/generation/examples.4b284b84b60c4py_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84b60c4py/evaluation/generation/examples.4b284b84b60c4py_GEM-web_nlg_en_PALM_prompt_3.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84b60c4py/evaluation/generation/examples.4b284b84b60c4py_GEM-wiki_lingua_en_tldr_en_4.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84b60c4py/evaluation/generation/examples.4b284b84b60c4py_GEM-wiki_lingua_en_tldr_en_5.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84b60c4py/evaluation/generation/examples.4b284b84b60c4py_gem_xsum_article_DOC_summary_1.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b84b10c4py/transformers/merges.txt filter=lfs diff=lfs merge=lfs -text diff --git a/4b284b84b10c4py/evaluation/4b284b84b10c4py_0_babi.json b/4b284b84b10c4py/evaluation/4b284b84b10c4py_0_babi.json new file mode 100644 index 0000000000000000000000000000000000000000..d0346821f4d509124258f4a36884c9477d69d312 --- /dev/null +++ b/4b284b84b10c4py/evaluation/4b284b84b10c4py_0_babi.json @@ -0,0 +1,22 @@ +{ + "results": { + "babi": { + "em": 0.0, + "em_stderr": 0.0 + } + }, + "versions": { + "babi": 0 + }, + "config": { + "model": "gpt2", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4py/4b284b84b10c4py/transformers", + "num_fewshot": 0, + "batch_size": null, + "device": null, + "no_cache": true, + "limit": 3000, + "bootstrap_iters": 100000, + "description_dict": {} + } +} \ No newline at end of file diff --git a/4b284b84b10c4py/evaluation/4b284b84b10c4py_1_babi.json b/4b284b84b10c4py/evaluation/4b284b84b10c4py_1_babi.json new file mode 100644 index 0000000000000000000000000000000000000000..820b85bc4031947026dc57a4070bf625570a948a --- /dev/null +++ b/4b284b84b10c4py/evaluation/4b284b84b10c4py_1_babi.json @@ -0,0 +1,22 @@ +{ + "results": { + "babi": { + "em": 0.14733333333333334, + "em_stderr": 0.006472199821615191 + } + }, + "versions": { + "babi": 0 + }, + "config": { + "model": "gpt2", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4py/4b284b84b10c4py/transformers", + "num_fewshot": 1, + "batch_size": null, + "device": null, + "no_cache": true, + "limit": 3000, + "bootstrap_iters": 100000, + "description_dict": {} + } +} \ No newline at end of file diff --git a/4b284b84b10c4py/evaluation/4b284b84b10c4py_2_babi.json b/4b284b84b10c4py/evaluation/4b284b84b10c4py_2_babi.json new file mode 100644 index 0000000000000000000000000000000000000000..b4052f743d7cf7ee397583a3d043d842f02ac541 --- /dev/null +++ b/4b284b84b10c4py/evaluation/4b284b84b10c4py_2_babi.json @@ -0,0 +1,22 @@ +{ + "results": { + "babi": { + "em": 0.2823333333333333, + "em_stderr": 0.00821966716987605 + } + }, + "versions": { + "babi": 0 + }, + "config": { + "model": "gpt2", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4py/4b284b84b10c4py/transformers", + "num_fewshot": 2, + "batch_size": null, + "device": null, + "no_cache": true, + "limit": 3000, + "bootstrap_iters": 100000, + "description_dict": {} + } +} \ No newline at end of file diff --git a/4b284b84b10c4py/evaluation/4b284b84b10c4py_3_babi.json b/4b284b84b10c4py/evaluation/4b284b84b10c4py_3_babi.json new file mode 100644 index 0000000000000000000000000000000000000000..75160b53bedb5b2fe21a8ef35e82cc70025dfd4c --- /dev/null +++ b/4b284b84b10c4py/evaluation/4b284b84b10c4py_3_babi.json @@ -0,0 +1,22 @@ +{ + "results": { + "babi": { + "em": 0.311, + "em_stderr": 0.008452819059344486 + } + }, + "versions": { + "babi": 0 + }, + "config": { + "model": "gpt2", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4py/4b284b84b10c4py/transformers", + "num_fewshot": 3, + "batch_size": null, + "device": null, + "no_cache": true, + "limit": 3000, + "bootstrap_iters": 100000, + "description_dict": {} + } +} \ No newline at end of file diff --git a/4b284b84b10c4py/evaluation/4b284b84b10c4py_4_babi.json b/4b284b84b10c4py/evaluation/4b284b84b10c4py_4_babi.json new file mode 100644 index 0000000000000000000000000000000000000000..d11cd77c79953b559b35f5b37b37f78b05e07d07 --- /dev/null +++ b/4b284b84b10c4py/evaluation/4b284b84b10c4py_4_babi.json @@ -0,0 +1,22 @@ +{ + "results": { + "babi": { + "em": 0.33766666666666667, + "em_stderr": 0.008635632828446824 + } + }, + "versions": { + "babi": 0 + }, + "config": { + "model": "gpt2", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4py/4b284b84b10c4py/transformers", + "num_fewshot": 4, + "batch_size": null, + "device": null, + "no_cache": true, + "limit": 3000, + "bootstrap_iters": 100000, + "description_dict": {} + } +} \ No newline at end of file diff --git a/4b284b84b10c4py/evaluation/4b284b84b10c4py_5_babi.json b/4b284b84b10c4py/evaluation/4b284b84b10c4py_5_babi.json new file mode 100644 index 0000000000000000000000000000000000000000..1ec302fd4db9c50ccf44e0d00763897f3c8b1c2a --- /dev/null +++ b/4b284b84b10c4py/evaluation/4b284b84b10c4py_5_babi.json @@ -0,0 +1,22 @@ +{ + "results": { + "babi": { + "em": 0.3554083885209713, + "em_stderr": 0.01591042834951585 + } + }, + "versions": { + "babi": 0 + }, + "config": { + "model": "gpt2", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4py/4b284b84b10c4py/transformers", + "num_fewshot": 5, + "batch_size": null, + "device": null, + "no_cache": false, + "limit": 906, + "bootstrap_iters": 100000, + "description_dict": {} + } +} diff --git a/4b284b84b10c4py/evaluation/generation/agg.4b284b84b10c4py_GEM-web_nlg_en_PALM_prompt_0.json b/4b284b84b10c4py/evaluation/generation/agg.4b284b84b10c4py_GEM-web_nlg_en_PALM_prompt_0.json new file mode 100644 index 0000000000000000000000000000000000000000..a2f95df376c0d2a5e16c7b9c9eb5eb7007924e81 --- /dev/null +++ b/4b284b84b10c4py/evaluation/generation/agg.4b284b84b10c4py_GEM-web_nlg_en_PALM_prompt_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.4813014742136315, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.029298284790512823}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.07814637483776633, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0013388565211954557}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.39367165732976755, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0052609219673642686}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.12355058601433035, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.001894994722809818}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.03357663912471221, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0007824220781305639}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.18024451705008498, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0037047453236374803}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.05343668682534253, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0011505936382800977}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.07298923635178714, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0011896452042006365}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.3727466061438325, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.005005690787063604}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.11573328163228513, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0017001940430562083}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.07168838309172086, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0012342784180538735}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.3612267886931813, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004790388470075587}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.11322320217099578, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0017394583047356308}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4py/4b284b84b10c4py/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84b10c4py/evaluation/generation/agg.4b284b84b10c4py_GEM-web_nlg_en_PALM_prompt_1.json b/4b284b84b10c4py/evaluation/generation/agg.4b284b84b10c4py_GEM-web_nlg_en_PALM_prompt_1.json new file mode 100644 index 0000000000000000000000000000000000000000..c52e43358315523a6c49f063db431579adce3122 --- /dev/null +++ b/4b284b84b10c4py/evaluation/generation/agg.4b284b84b10c4py_GEM-web_nlg_en_PALM_prompt_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.7255238696408423, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.053879561708253726}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.1625223257514928, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.005111682257014667}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.32599686697536673, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.005056163504321368}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.17553593173895937, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.004096195356643218}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.08437320166589189, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.003472257493578088}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.17009103545543425, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0036595655247239614}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.08995358919930085, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.00276677511793771}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.1443002602162733, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.004479274553715264}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.3023393609518485, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004598931367210058}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.1575106385009677, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0035058149961314554}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.14870447627323272, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.00462570655861519}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.3067494379024135, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004650958784315044}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.1613119682169033, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0036048812212870155}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4py/4b284b84b10c4py/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84b10c4py/evaluation/generation/agg.4b284b84b10c4py_GEM-web_nlg_en_PALM_prompt_2.json b/4b284b84b10c4py/evaluation/generation/agg.4b284b84b10c4py_GEM-web_nlg_en_PALM_prompt_2.json new file mode 100644 index 0000000000000000000000000000000000000000..a4e57f67e2d54cb5463e42a714feccc571172da9 --- /dev/null +++ b/4b284b84b10c4py/evaluation/generation/agg.4b284b84b10c4py_GEM-web_nlg_en_PALM_prompt_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.8687128586366801, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.04673010602404015}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.1701554452582214, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.005107771330279079}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.355832019011606, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004884775439773983}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.19129452100187833, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.004216273048303227}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.09088743631977127, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.003444014418662031}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.18939437656895264, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0037355969446100823}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.10058078270140805, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0029257899877312156}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.14879189467464685, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0043534563737425485}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.32802790773843415, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004479264764219749}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.1700727632598896, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.003579698843822934}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.1549450062748448, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.004557766264854074}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.334886885021682, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004545614262741492}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.17593789645790273, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0037452392698808686}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4py/4b284b84b10c4py/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84b10c4py/evaluation/generation/agg.4b284b84b10c4py_GEM-web_nlg_en_PALM_prompt_3.json b/4b284b84b10c4py/evaluation/generation/agg.4b284b84b10c4py_GEM-web_nlg_en_PALM_prompt_3.json new file mode 100644 index 0000000000000000000000000000000000000000..b4d23f7731c819123dc08ab11c32063fe694b23d --- /dev/null +++ b/4b284b84b10c4py/evaluation/generation/agg.4b284b84b10c4py_GEM-web_nlg_en_PALM_prompt_3.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.976110601716665, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.05147232952331574}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.17650374199610544, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.005278588530178822}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.3620490484768146, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004763724984545098}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.1955261278048012, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0042687987276028025}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.09649007165425032, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.003579903171459426}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.1932492774677527, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0036237451702642704}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.10373196315248306, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.002909773730879196}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.15353988316234024, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.004424257414579797}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.3329632854608314, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004284658072005821}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.1729686164923851, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.003539784845210468}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.1606790115172626, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.004723404323298352}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.33915285374439175, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004340341067923443}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.17904838371148374, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.003744462902264531}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4py/4b284b84b10c4py/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 3, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84b10c4py/evaluation/generation/agg.4b284b84b10c4py_GEM-web_nlg_en_PALM_prompt_4.json b/4b284b84b10c4py/evaluation/generation/agg.4b284b84b10c4py_GEM-web_nlg_en_PALM_prompt_4.json new file mode 100644 index 0000000000000000000000000000000000000000..68a87897ef951ef8f6b4c4e1f1c7b2e84a5e37de --- /dev/null +++ b/4b284b84b10c4py/evaluation/generation/agg.4b284b84b10c4py_GEM-web_nlg_en_PALM_prompt_4.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 1.0350167319929164, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.08089511258341531}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.18224379597295554, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0054869315349140284}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.3728518882868007, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004805363061413696}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.20005984608564545, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0043621938032114985}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.10200985474477063, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0037380638769571885}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.20291177783621683, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.003801448242387614}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.10839195425794168, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0030187532546412294}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.15805723338022432, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.004637765426393908}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.341594924355393, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004322861765243894}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.17627371459053626, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0036366682681705747}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.16598914017637473, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.004915957758353431}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.35013405773908396, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0044261493721537235}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.18370609844319763, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.003859835340459462}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4py/4b284b84b10c4py/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 4, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84b10c4py/evaluation/generation/agg.4b284b84b10c4py_GEM-web_nlg_en_PALM_prompt_5.json b/4b284b84b10c4py/evaluation/generation/agg.4b284b84b10c4py_GEM-web_nlg_en_PALM_prompt_5.json new file mode 100644 index 0000000000000000000000000000000000000000..f0f3a6adcd9e51f54e653241d96b10c76bd45672 --- /dev/null +++ b/4b284b84b10c4py/evaluation/generation/agg.4b284b84b10c4py_GEM-web_nlg_en_PALM_prompt_5.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 1.099500805669065, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.05128274555498221}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.18895154801724418, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.005525818321828389}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.38248844776913693, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004934647163878857}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.21085477597688443, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.004537288839362036}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.10447278232108755, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.003746341946804797}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.2070479482405224, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.003822643707608457}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.11341187327748274, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0031174298961979667}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.16301359107525903, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.004631366227638678}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.3486223306539461, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0043860650726248295}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.18499664526019835, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0037604793276689013}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.1713978535792387, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.00494124825637956}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.3573153383883979, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004488735837365747}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.19265091926675612, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.003995741079720777}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4py/4b284b84b10c4py/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 5, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84b10c4py/evaluation/generation/agg.4b284b84b10c4py_GEM-wiki_lingua_en_tldr_en_0.json b/4b284b84b10c4py/evaluation/generation/agg.4b284b84b10c4py_GEM-wiki_lingua_en_tldr_en_0.json new file mode 100644 index 0000000000000000000000000000000000000000..765798ac20718d50d5df30e4b374741c9080f15b --- /dev/null +++ b/4b284b84b10c4py/evaluation/generation/agg.4b284b84b10c4py_GEM-wiki_lingua_en_tldr_en_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.1824848450703605, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.002258769733514356}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.2829504579856686, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.002892378725128921}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.20438865109293125, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0020542271239135474}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.043109912585657335, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0009711440225665886}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.06736443489887266, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0015632414031077888}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.048105932388098856, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0010139576129839956}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.13644080096663336, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0015842215640080625}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.21853544620158255, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0022785408725319403}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.15441829967250942, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0014514089251988502}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.16955964056676814, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.002110604546495203}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.2633994155788588, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0027106937173640546}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.18999551527620429, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0019185335839288905}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 2.439034811249811, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.08814349202270069}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4py/4b284b84b10c4py/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84b10c4py/evaluation/generation/agg.4b284b84b10c4py_GEM-wiki_lingua_en_tldr_en_1.json b/4b284b84b10c4py/evaluation/generation/agg.4b284b84b10c4py_GEM-wiki_lingua_en_tldr_en_1.json new file mode 100644 index 0000000000000000000000000000000000000000..c6bc599b920e2472c7f5da08aeaa1362bd4849ae --- /dev/null +++ b/4b284b84b10c4py/evaluation/generation/agg.4b284b84b10c4py_GEM-wiki_lingua_en_tldr_en_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.27650295097853705, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.00433037610306865}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.20123333179446745, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0029592287408768563}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.1817945339591683, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0021379348675478974}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.07927146370780327, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0028993886109516787}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.048713843049408144, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0014696170848375373}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.04414011089261056, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0011864515717073022}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.22325969773232404, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0038282019630928436}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.15381843600559833, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0022441425803852682}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.14036723611181662, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.001621088879287515}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.2620080990727989, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0041842438687289705}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.18922669116358481, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0027816420778518647}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.17107746115835645, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.002004425675535598}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 2.592511832648172, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.0883522873390386}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4py/4b284b84b10c4py/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84b10c4py/evaluation/generation/agg.4b284b84b10c4py_GEM-wiki_lingua_en_tldr_en_2.json b/4b284b84b10c4py/evaluation/generation/agg.4b284b84b10c4py_GEM-wiki_lingua_en_tldr_en_2.json new file mode 100644 index 0000000000000000000000000000000000000000..704d9871ea99b7ed33f1623fa2f2a88ba4eade97 --- /dev/null +++ b/4b284b84b10c4py/evaluation/generation/agg.4b284b84b10c4py_GEM-wiki_lingua_en_tldr_en_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.33293478487683886, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.004638481088709241}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.20832991559189593, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.002882384230492161}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.201455981397101, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002215864605685192}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.10981600440845445, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0032662143067739334}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.0571749108797057, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0014697451697197228}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.056871066430790325, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.001341215790213451}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.2702435488101451, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.004129606571484203}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.1613125746864521, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0022067815922600644}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.1572901498332904, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.001727626060232697}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.31764168504184737, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.004542434958936431}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.19654070699277223, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0027147097304651784}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.1904207426584212, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0020985538580578374}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 3.1897316776859443, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.10383641450422736}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4py/4b284b84b10c4py/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84b10c4py/evaluation/generation/agg.4b284b84b10c4py_GEM-wiki_lingua_en_tldr_en_3.json b/4b284b84b10c4py/evaluation/generation/agg.4b284b84b10c4py_GEM-wiki_lingua_en_tldr_en_3.json new file mode 100644 index 0000000000000000000000000000000000000000..09de5234588902adac78cd6b9d1500de11421c49 --- /dev/null +++ b/4b284b84b10c4py/evaluation/generation/agg.4b284b84b10c4py_GEM-wiki_lingua_en_tldr_en_3.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.2993896407068062, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.004961826525869491}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.17036445945014525, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0030340761083348573}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.17011994598152969, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0024811944029056563}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.10010009650819313, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0032857461552203595}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.04756100531684024, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0014329928419246308}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.04854258938628169, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0013429745795374734}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.2477387853206388, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.004400377182402362}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.13297516874095594, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0023567485440671196}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.13474954073077003, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.001970359077922383}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.28541851433610155, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.004807244705293582}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.16068089265916596, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0028651117671434395}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.16095317824352906, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0023610481534614897}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 2.1373295852103618, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.09657133458196947}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4py/4b284b84b10c4py/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 3, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84b10c4py/evaluation/generation/agg.4b284b84b10c4py_GEM-wiki_lingua_en_tldr_en_4.json b/4b284b84b10c4py/evaluation/generation/agg.4b284b84b10c4py_GEM-wiki_lingua_en_tldr_en_4.json new file mode 100644 index 0000000000000000000000000000000000000000..db0afdcc330cfec223557011dbb8700f71c83309 --- /dev/null +++ b/4b284b84b10c4py/evaluation/generation/agg.4b284b84b10c4py_GEM-wiki_lingua_en_tldr_en_4.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.10233602202490566, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.003901148966833399}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.05690170219061377, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.002261392037062523}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.05785530003387149, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002104739102006248}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.032881948765465734, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.00214275596785197}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.015513277487513246, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0009900569977354416}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.016216361695071208, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0009795250112890484}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.0857146344396996, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.003416320759360737}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.0445264515835226, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0017587334889400765}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.046183940516235616, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0016983322564463742}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.0972394371974616, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.003756250172857945}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.05298521225905992, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0021031803096113336}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.054222605768747344, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.001979311930128123}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 0.03779045940266729, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.00499486813251369}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4py/4b284b84b10c4py/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 4, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84b10c4py/evaluation/generation/agg.4b284b84b10c4py_GEM-wiki_lingua_en_tldr_en_5.json b/4b284b84b10c4py/evaluation/generation/agg.4b284b84b10c4py_GEM-wiki_lingua_en_tldr_en_5.json new file mode 100644 index 0000000000000000000000000000000000000000..8b94c6d7a9f650e8441bd9f6a9d1c1da23813479 --- /dev/null +++ b/4b284b84b10c4py/evaluation/generation/agg.4b284b84b10c4py_GEM-wiki_lingua_en_tldr_en_5.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.01666321917537446, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0017144844493535089}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.009157687542181802, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0009736218557175297}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.00927977866130263, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0009046636518910162}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.005635566478053115, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0009678519939045886}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.002607955654242479, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0004157349477803617}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.0027628200691328687, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.00040474421977877023}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.014505480826312199, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0015703654365691406}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.007377263181545838, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0007854353219556513}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.007640431942454017, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0007551641757705242}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.01613430616214765, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0016859400230554314}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.008638145878204216, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0009157832781292763}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.008819513768437372, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0008640055278148719}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 6.058866159905281e-16, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 2.3900117794994548e-15}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4py/4b284b84b10c4py/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 5, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84b10c4py/evaluation/generation/agg.4b284b84b10c4py_e2e_nlg_cleaned_generate_text_restaurant_0.json b/4b284b84b10c4py/evaluation/generation/agg.4b284b84b10c4py_e2e_nlg_cleaned_generate_text_restaurant_0.json new file mode 100644 index 0000000000000000000000000000000000000000..1e3336aefb3103c669775b10d4c268cdea589bb7 --- /dev/null +++ b/4b284b84b10c4py/evaluation/generation/agg.4b284b84b10c4py_e2e_nlg_cleaned_generate_text_restaurant_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 2.021544193176019, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.04672525631492646}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.3452949497006971, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0031874336438570136}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.3412418289576795, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0034398228533816144}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.33225583490736194, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0030225097754752873}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.11855573943397561, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0015761697052151904}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.12140620974140548, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0018263607260067699}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.11599617848462068, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0015886302807693743}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.24616297725036965, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0022797007734971847}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.24639726684479762, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0025797032547250176}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.2383281424265221, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.002215264906335406}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.3190175340171995, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.002958732504531792}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.31764816538422297, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0033043767478234854}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.3081149911342974, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0028594046078756815}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4py/4b284b84b10c4py/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84b10c4py/evaluation/generation/agg.4b284b84b10c4py_e2e_nlg_cleaned_generate_text_restaurant_1.json b/4b284b84b10c4py/evaluation/generation/agg.4b284b84b10c4py_e2e_nlg_cleaned_generate_text_restaurant_1.json new file mode 100644 index 0000000000000000000000000000000000000000..3a1944380bd95ac36cafc96f9e04606597b10c51 --- /dev/null +++ b/4b284b84b10c4py/evaluation/generation/agg.4b284b84b10c4py_e2e_nlg_cleaned_generate_text_restaurant_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 14.53743726129001, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.14445690934234265}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.6082899833637005, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0032135327715503183}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.4939991587989527, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0031897368344663206}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.5180906148683028, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0024567692495659718}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.2992841860287957, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0027535069501413525}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.24073848287899435, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0023692738232853716}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.25244576500518445, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0021987704228017047}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.4377558923516418, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0030209364495319283}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.3522118606318514, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0026145016755065214}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.3702354270220447, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.002229049797298906}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.49559037424824853, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0031867294805906312}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.4017134750190358, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.002963390841940911}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.4215085599639745, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0024837056691902086}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4py/4b284b84b10c4py/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84b10c4py/evaluation/generation/agg.4b284b84b10c4py_e2e_nlg_cleaned_generate_text_restaurant_2.json b/4b284b84b10c4py/evaluation/generation/agg.4b284b84b10c4py_e2e_nlg_cleaned_generate_text_restaurant_2.json new file mode 100644 index 0000000000000000000000000000000000000000..5180fbce96678d479fd0aa656e969ce0ae85176d --- /dev/null +++ b/4b284b84b10c4py/evaluation/generation/agg.4b284b84b10c4py_e2e_nlg_cleaned_generate_text_restaurant_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 16.6974233877375, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.2259702264159085}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.6308114156673001, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0030515635455948056}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.5241737976358826, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0029634534710997382}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.550751959150263, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002334628388103356}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.3245854766100972, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.002738959218334304}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.26676548563429314, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.002350700363573182}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.28087700716585834, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.002229388349802515}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.4599329987100549, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0029633837519416856}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.38012920627255303, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002577942917596876}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.40000959435601263, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.002278833446615684}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.52202474439705, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0031213147774664753}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.4336862446313041, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.002861587766898658}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.4557773932977128, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0024812907319972668}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4py/4b284b84b10c4py/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84b10c4py/evaluation/generation/agg.4b284b84b10c4py_e2e_nlg_cleaned_generate_text_restaurant_3.json b/4b284b84b10c4py/evaluation/generation/agg.4b284b84b10c4py_e2e_nlg_cleaned_generate_text_restaurant_3.json new file mode 100644 index 0000000000000000000000000000000000000000..a7462e3fa43221bcd7b7606385922297a1fef5d9 --- /dev/null +++ b/4b284b84b10c4py/evaluation/generation/agg.4b284b84b10c4py_e2e_nlg_cleaned_generate_text_restaurant_3.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 17.234863759565464, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.10626094777357345}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.6451638771759513, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0029145371412898314}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.5273596630229687, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0028796397050091654}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.5604782743289571, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0022490187814614418}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.337823399687939, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.002721131963155123}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.2741776446898378, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.002401017670924296}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.29137647462406413, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0022566745277518207}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.4713022566374456, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.002890868676128115}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.38393681062737384, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0025637744220680424}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.40840245354897814, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.002267056969140555}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.5372731680476394, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0030240854085328223}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.4392611204948281, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0028130487549137095}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.4667947275839455, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.002424767456065824}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4py/4b284b84b10c4py/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 3, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84b10c4py/evaluation/generation/agg.4b284b84b10c4py_e2e_nlg_cleaned_generate_text_restaurant_4.json b/4b284b84b10c4py/evaluation/generation/agg.4b284b84b10c4py_e2e_nlg_cleaned_generate_text_restaurant_4.json new file mode 100644 index 0000000000000000000000000000000000000000..1187be937cac39e9a945210af71b221c034d662f --- /dev/null +++ b/4b284b84b10c4py/evaluation/generation/agg.4b284b84b10c4py_e2e_nlg_cleaned_generate_text_restaurant_4.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 17.43221273186975, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.14852992258132883}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.6566667386405739, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0029901104310675994}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.5250310784733211, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.002880579788531886}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.5644088431191606, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0022998414866846426}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.3489715445596063, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0028379714911102717}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.2759061577612267, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.002418733555610404}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.29718267067971493, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0023174404504521418}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.48238946977859254, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0030258886889425406}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.3841163890326242, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0025948324351265347}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.413398262443025, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0023490992885206218}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.5493173554754809, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0031195526839171693}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.43936018496359347, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0028421410516723516}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.4722659980511927, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.002493574854840473}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4py/4b284b84b10c4py/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 4, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84b10c4py/evaluation/generation/agg.4b284b84b10c4py_e2e_nlg_cleaned_generate_text_restaurant_5.json b/4b284b84b10c4py/evaluation/generation/agg.4b284b84b10c4py_e2e_nlg_cleaned_generate_text_restaurant_5.json new file mode 100644 index 0000000000000000000000000000000000000000..ecf12e4c2170abe4a6c858addf3b369158e8a224 --- /dev/null +++ b/4b284b84b10c4py/evaluation/generation/agg.4b284b84b10c4py_e2e_nlg_cleaned_generate_text_restaurant_5.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 17.27987171682975, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.22299466307707344}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.6628915228196061, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.002895062323071317}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.5218597939831594, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0027835407580159314}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.5661613833598578, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0022266488649150696}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.3538900021766568, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.002806480832935743}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.27471917389658523, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0023266477815265104}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.2990249691536151, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0022661493792424697}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.4881090745767031, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0029641049977624664}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.3820604186528641, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0024902085041821334}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.41542888953754, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.002290321145556158}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.5555907001865986, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0030782994957697994}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.4369700778836929, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.002723697352083028}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.47431838670472687, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.002431375830473114}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4py/4b284b84b10c4py/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 5, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84b10c4py/evaluation/generation/agg.4b284b84b10c4py_gem_xsum_article_DOC_summary_0.json b/4b284b84b10c4py/evaluation/generation/agg.4b284b84b10c4py_gem_xsum_article_DOC_summary_0.json new file mode 100644 index 0000000000000000000000000000000000000000..36899968134236e75daa35ada537e056df11606c --- /dev/null +++ b/4b284b84b10c4py/evaluation/generation/agg.4b284b84b10c4py_gem_xsum_article_DOC_summary_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.16091335382563132, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0023214839725675105}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.31192453482745763, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.00431663840907332}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.20154310340791382, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002503527086260468}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.030192336082604687, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0011298757941540884}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.06486203625582514, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.002495687484786392}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.03939889642394197, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0014269911312081135}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.11804593952699223, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.001705008234352379}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.23090498894651582, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.003262191317539296}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.14814803620232633, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0018194923690126705}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.12345041061371383, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0018404072547649245}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.24335540258442262, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0037333681065596135}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.15559873712369335, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.002082741430413441}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 1.598333295912428, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.04369181828078937}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4py/4b284b84b10c4py/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84b10c4py/evaluation/generation/agg.4b284b84b10c4py_gem_xsum_article_DOC_summary_1.json b/4b284b84b10c4py/evaluation/generation/agg.4b284b84b10c4py_gem_xsum_article_DOC_summary_1.json new file mode 100644 index 0000000000000000000000000000000000000000..000d125086695de636730c8fddf337ac9923b58f --- /dev/null +++ b/4b284b84b10c4py/evaluation/generation/agg.4b284b84b10c4py_gem_xsum_article_DOC_summary_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.1740287506077371, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0035762963549450144}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.23534981942590377, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.003659738471811391}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.18440937659488896, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.003013311852017229}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.03131736257651789, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0017657388713041011}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.03976502875447221, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.001888187751012635}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.03225325166687549, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0016333078188436293}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.13323315845033426, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0026925290035192807}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.18196243615159283, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002782613837447707}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.14145239281725078, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0022406116825912387}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.13483891468420867, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0027354596616931065}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.18482502398325326, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.002947981471107514}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.14336629014297197, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0023103743217644922}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 1.3695546970670758, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.11288065979583667}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4py/4b284b84b10c4py/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84b10c4py/evaluation/generation/agg.4b284b84b10c4py_gem_xsum_article_DOC_summary_2.json b/4b284b84b10c4py/evaluation/generation/agg.4b284b84b10c4py_gem_xsum_article_DOC_summary_2.json new file mode 100644 index 0000000000000000000000000000000000000000..6bde0e3676f54d3d615c126f23ba24f8deeb9c87 --- /dev/null +++ b/4b284b84b10c4py/evaluation/generation/agg.4b284b84b10c4py_gem_xsum_article_DOC_summary_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.19985236655576322, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.003978452096741706}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.243103956744537, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0036939855243832025}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.20363897243347945, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0032917079133891604}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.039138232698124914, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.002062532698520258}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.044204414475646464, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.002004713309978894}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.03868362872963243, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0018516242073862486}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.1506477774402608, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.003020476793401718}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.18469817921156023, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0027972563470297306}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.15378100277488155, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0024750584853391777}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.15239590573770034, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0030467162920539536}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.18749040242023876, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0029321410628762915}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.15570322493810856, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0025139232679603388}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 1.7308730289259378, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.17770532210337478}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4py/4b284b84b10c4py/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84b10c4py/evaluation/generation/agg.4b284b84b10c4py_gem_xsum_article_DOC_summary_3.json b/4b284b84b10c4py/evaluation/generation/agg.4b284b84b10c4py_gem_xsum_article_DOC_summary_3.json new file mode 100644 index 0000000000000000000000000000000000000000..b63d4a9d2dadcc57304148035edcc9359bf9e624 --- /dev/null +++ b/4b284b84b10c4py/evaluation/generation/agg.4b284b84b10c4py_gem_xsum_article_DOC_summary_3.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.19589658794017453, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0039853906513849366}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.22849167295097247, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0038566308815145126}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.1953341147235192, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.003349630735723747}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.03625824703902077, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0018314388825531765}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.0410258003930899, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0018846780449691557}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.035779638469116914, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0016750996803778595}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.148688151900945, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.003095918669053127}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.17399714292187934, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0029506577213898122}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.1480464200642175, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0025456089591690385}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.1509875423818125, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.003109411289001428}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.17818678675083813, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.003105658861483215}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.150857629725387, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0025908796219687017}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 1.6177421822314764, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.16975721226529852}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4py/4b284b84b10c4py/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 3, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84b10c4py/evaluation/generation/agg.4b284b84b10c4py_gem_xsum_article_DOC_summary_4.json b/4b284b84b10c4py/evaluation/generation/agg.4b284b84b10c4py_gem_xsum_article_DOC_summary_4.json new file mode 100644 index 0000000000000000000000000000000000000000..bd38c3304a06ce851a744976b130c7b70c913361 --- /dev/null +++ b/4b284b84b10c4py/evaluation/generation/agg.4b284b84b10c4py_gem_xsum_article_DOC_summary_4.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.06152754510214762, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.003813964694018243}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.060593832681025625, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0035841876676039335}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.055186415576932185, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0031944085309462042}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.011572977582773758, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0012872321658089607}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.01149657270593299, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0011931029906206063}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.010566772575448751, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0010986586323403539}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.046781635255582606, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.00298661745817834}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.04475132182365535, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0026420061653404576}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.041175984283283985, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0024057569727709742}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.04812651646509195, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0030363159363846065}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.04684919680777955, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0027817704867131674}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.04268034684571005, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.002476327367349351}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 0.21556427831831304, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.05992392947727259}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4py/4b284b84b10c4py/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 4, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84b10c4py/evaluation/generation/agg.4b284b84b10c4py_gem_xsum_article_DOC_summary_5.json b/4b284b84b10c4py/evaluation/generation/agg.4b284b84b10c4py_gem_xsum_article_DOC_summary_5.json new file mode 100644 index 0000000000000000000000000000000000000000..76b01f9db8be546e9534fc3afd5303d6cab9d7aa --- /dev/null +++ b/4b284b84b10c4py/evaluation/generation/agg.4b284b84b10c4py_gem_xsum_article_DOC_summary_5.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.0031162728399716532, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0008737460454355458}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.002628521163198049, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0007303851868588104}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.0027771927477267732, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0007722613879690155}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.000451588582831646, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.00021783265095521171}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.00036940260996864765, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.00019380741759243087}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.0004013828039517138, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.00020138596141432264}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.0023063072540261626, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.000636589500329542}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.001989261212241742, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0005658258080821268}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.002068253073845221, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0005744934556807894}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.0025476363697054154, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0007118711755257363}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.0021837068783855215, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0006187556981975251}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.00228235191573137, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0006382890720853227}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 1.1959919832512981e-41, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 4.418229601032825e-38}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4py/4b284b84b10c4py/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 5, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b84b10c4py/evaluation/generation/examples.4b284b84b10c4py_GEM-web_nlg_en_PALM_prompt_0.jsonl b/4b284b84b10c4py/evaluation/generation/examples.4b284b84b10c4py_GEM-web_nlg_en_PALM_prompt_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..b24dd10f81ba04965dc7ef256d1c91451c1a56e0 --- /dev/null +++ b/4b284b84b10c4py/evaluation/generation/examples.4b284b84b10c4py_GEM-web_nlg_en_PALM_prompt_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d075552527f0860f101cec64e9aeab118687e1a6d0511ce6627698fc7d79c3e3 +size 4191186 diff --git a/4b284b84b10c4py/evaluation/generation/examples.4b284b84b10c4py_GEM-web_nlg_en_PALM_prompt_1.jsonl b/4b284b84b10c4py/evaluation/generation/examples.4b284b84b10c4py_GEM-web_nlg_en_PALM_prompt_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..e7e1dc8c6abb00f768f7e53722bdf66e1732d71f --- /dev/null +++ b/4b284b84b10c4py/evaluation/generation/examples.4b284b84b10c4py_GEM-web_nlg_en_PALM_prompt_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b015af073298fa4483488c06e4953efce99a9b00a226b0b01bb86b911cddbd4f +size 4632255 diff --git a/4b284b84b10c4py/evaluation/generation/examples.4b284b84b10c4py_GEM-web_nlg_en_PALM_prompt_2.jsonl b/4b284b84b10c4py/evaluation/generation/examples.4b284b84b10c4py_GEM-web_nlg_en_PALM_prompt_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..4b389f4a1a746407d1dd5527f57629c0836b4b23 --- /dev/null +++ b/4b284b84b10c4py/evaluation/generation/examples.4b284b84b10c4py_GEM-web_nlg_en_PALM_prompt_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0785e7e6f1e27d6823eeadca4fcba9d28ef8c6dcdec1014be1e0b1feca813ef1 +size 5587382 diff --git a/4b284b84b10c4py/evaluation/generation/examples.4b284b84b10c4py_GEM-web_nlg_en_PALM_prompt_3.jsonl b/4b284b84b10c4py/evaluation/generation/examples.4b284b84b10c4py_GEM-web_nlg_en_PALM_prompt_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..e118458206e9a935df8eea9ea51f167eb14a63a9 --- /dev/null +++ b/4b284b84b10c4py/evaluation/generation/examples.4b284b84b10c4py_GEM-web_nlg_en_PALM_prompt_3.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e6c473429791b3a42e0c57db43c2ce1255d20f431b4c44907dec23fe56118f2 +size 6502216 diff --git a/4b284b84b10c4py/evaluation/generation/examples.4b284b84b10c4py_GEM-web_nlg_en_PALM_prompt_4.jsonl b/4b284b84b10c4py/evaluation/generation/examples.4b284b84b10c4py_GEM-web_nlg_en_PALM_prompt_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..0a1407062764688579efd65ccf07eee51bdfd7c7 --- /dev/null +++ b/4b284b84b10c4py/evaluation/generation/examples.4b284b84b10c4py_GEM-web_nlg_en_PALM_prompt_4.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b0368b462984991944c8d97c3798512f7d14ec6ac191c6f6cb69bc1b278c3512 +size 7406403 diff --git a/4b284b84b10c4py/evaluation/generation/examples.4b284b84b10c4py_GEM-web_nlg_en_PALM_prompt_5.jsonl b/4b284b84b10c4py/evaluation/generation/examples.4b284b84b10c4py_GEM-web_nlg_en_PALM_prompt_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..7e8c8bb8abf0cce2301689c3c327a7b266c9d1fc --- /dev/null +++ b/4b284b84b10c4py/evaluation/generation/examples.4b284b84b10c4py_GEM-web_nlg_en_PALM_prompt_5.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0f69a7062dd59e2ef059912cc4dc02d5029058f373ffa8ae7945af2ff81ef614 +size 8281798 diff --git a/4b284b84b10c4py/evaluation/generation/examples.4b284b84b10c4py_GEM-wiki_lingua_en_tldr_en_0.jsonl b/4b284b84b10c4py/evaluation/generation/examples.4b284b84b10c4py_GEM-wiki_lingua_en_tldr_en_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..61c257f0d000cd42ec36d0114a2f63059afde347 --- /dev/null +++ b/4b284b84b10c4py/evaluation/generation/examples.4b284b84b10c4py_GEM-wiki_lingua_en_tldr_en_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:caf5156f5867d5e75d57eb60c0d0ac66963c972a0d81a6c3f05b93938d6f84e8 +size 7653088 diff --git a/4b284b84b10c4py/evaluation/generation/examples.4b284b84b10c4py_GEM-wiki_lingua_en_tldr_en_1.jsonl b/4b284b84b10c4py/evaluation/generation/examples.4b284b84b10c4py_GEM-wiki_lingua_en_tldr_en_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..5214a57157b2fccf0c6d9c058123cac75979fce1 --- /dev/null +++ b/4b284b84b10c4py/evaluation/generation/examples.4b284b84b10c4py_GEM-wiki_lingua_en_tldr_en_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7847c818bb53ba2d2a36ccf2724ea50a2d526a5107d0b05a096d0f842649c294 +size 12972670 diff --git a/4b284b84b10c4py/evaluation/generation/examples.4b284b84b10c4py_GEM-wiki_lingua_en_tldr_en_2.jsonl b/4b284b84b10c4py/evaluation/generation/examples.4b284b84b10c4py_GEM-wiki_lingua_en_tldr_en_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..51ce3a5d77f4e706eeb37c170ff22a693f24c58c --- /dev/null +++ b/4b284b84b10c4py/evaluation/generation/examples.4b284b84b10c4py_GEM-wiki_lingua_en_tldr_en_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fda43c526a6497601488851eb4bedb4d9d853b0ea6fd4363c7037121b62d9d7b +size 18530083 diff --git a/4b284b84b10c4py/evaluation/generation/examples.4b284b84b10c4py_GEM-wiki_lingua_en_tldr_en_3.jsonl b/4b284b84b10c4py/evaluation/generation/examples.4b284b84b10c4py_GEM-wiki_lingua_en_tldr_en_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..47de48c4e82db91213d3a3984491d24c6e630870 --- /dev/null +++ b/4b284b84b10c4py/evaluation/generation/examples.4b284b84b10c4py_GEM-wiki_lingua_en_tldr_en_3.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d2a970fa4a53237662dcf851de5bd29fb1287f3e47f130681bd5d8f9af583a4f +size 23992252 diff --git a/4b284b84b10c4py/evaluation/generation/examples.4b284b84b10c4py_GEM-wiki_lingua_en_tldr_en_4.jsonl b/4b284b84b10c4py/evaluation/generation/examples.4b284b84b10c4py_GEM-wiki_lingua_en_tldr_en_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..21cea275f399b7461243ee41938871e382386d86 --- /dev/null +++ b/4b284b84b10c4py/evaluation/generation/examples.4b284b84b10c4py_GEM-wiki_lingua_en_tldr_en_4.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d6c122fcf067cde14fae4afae6f4b4dc77d58c64e7be226418e7c1b374f3d287 +size 29359016 diff --git a/4b284b84b10c4py/evaluation/generation/examples.4b284b84b10c4py_GEM-wiki_lingua_en_tldr_en_5.jsonl b/4b284b84b10c4py/evaluation/generation/examples.4b284b84b10c4py_GEM-wiki_lingua_en_tldr_en_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..c127ee0c5f16ebaae9c6d6c40edb81a02acf04e9 --- /dev/null +++ b/4b284b84b10c4py/evaluation/generation/examples.4b284b84b10c4py_GEM-wiki_lingua_en_tldr_en_5.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:31f11c9cb24d48535f58c6af9ddaaf1e13330352283a4a0fd7cc87318d091e10 +size 34782328 diff --git a/4b284b84b10c4py/evaluation/generation/examples.4b284b84b10c4py_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl b/4b284b84b10c4py/evaluation/generation/examples.4b284b84b10c4py_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..bc8e4330ccb5b811d070c8353d6d9a92043140ff --- /dev/null +++ b/4b284b84b10c4py/evaluation/generation/examples.4b284b84b10c4py_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:79f2ee013b7410a255d4eab8833fc0488829373937d6d9de7ab88f6ad0b9fe52 +size 4232457 diff --git a/4b284b84b10c4py/evaluation/generation/examples.4b284b84b10c4py_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl b/4b284b84b10c4py/evaluation/generation/examples.4b284b84b10c4py_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..fb320e919159c1a180c42be02377824a6d56d55b --- /dev/null +++ b/4b284b84b10c4py/evaluation/generation/examples.4b284b84b10c4py_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b90ff3c6dbc6e3d479ef4bab0794131019a32fba591c0a22b25103c5e5c4d3f9 +size 5028930 diff --git a/4b284b84b10c4py/evaluation/generation/examples.4b284b84b10c4py_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl b/4b284b84b10c4py/evaluation/generation/examples.4b284b84b10c4py_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..49b490790f9917ea2e049ddde7b049fdc7c1e70f --- /dev/null +++ b/4b284b84b10c4py/evaluation/generation/examples.4b284b84b10c4py_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1cbb0636e4bd469a5e10ffe5f18fabf733fc8ebc03ef01c792690ed182250d82 +size 6114646 diff --git a/4b284b84b10c4py/evaluation/generation/examples.4b284b84b10c4py_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl b/4b284b84b10c4py/evaluation/generation/examples.4b284b84b10c4py_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..88c9bee408391acb925d68250c31b9fb59bee860 --- /dev/null +++ b/4b284b84b10c4py/evaluation/generation/examples.4b284b84b10c4py_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1a666874c9ab081cb5bf92ca36c98497f87a47420176d3efa1b501e8d72588a9 +size 7187421 diff --git a/4b284b84b10c4py/evaluation/generation/examples.4b284b84b10c4py_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl b/4b284b84b10c4py/evaluation/generation/examples.4b284b84b10c4py_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..cc5ea6e4cca638e0c2b8b9d18af6871dab44b90c --- /dev/null +++ b/4b284b84b10c4py/evaluation/generation/examples.4b284b84b10c4py_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:556466d355331d3b3206e179c41dbe77552deb00d59e3d6f893843d00ca45385 +size 8259288 diff --git a/4b284b84b10c4py/evaluation/generation/examples.4b284b84b10c4py_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl b/4b284b84b10c4py/evaluation/generation/examples.4b284b84b10c4py_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..21250708ea72090038c142192cf2d127b5a147a1 --- /dev/null +++ b/4b284b84b10c4py/evaluation/generation/examples.4b284b84b10c4py_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:493d1337a478a72815426b09a91f12b95ad4f200eb464ba4d8fbb54dc569e59f +size 9338810 diff --git a/4b284b84b10c4py/evaluation/generation/examples.4b284b84b10c4py_gem_xsum_article_DOC_summary_0.jsonl b/4b284b84b10c4py/evaluation/generation/examples.4b284b84b10c4py_gem_xsum_article_DOC_summary_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..ad54bb92644c613800b629e1060dce0133cae596 --- /dev/null +++ b/4b284b84b10c4py/evaluation/generation/examples.4b284b84b10c4py_gem_xsum_article_DOC_summary_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee15ad6e11ad366d10c202247dd43728c6f61a8cd52cec1b51e9c3f197401a49 +size 2787428 diff --git a/4b284b84b10c4py/evaluation/generation/examples.4b284b84b10c4py_gem_xsum_article_DOC_summary_1.jsonl b/4b284b84b10c4py/evaluation/generation/examples.4b284b84b10c4py_gem_xsum_article_DOC_summary_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..5b2dc89bd19d8814718c90bd2808f7c6f2dc02c1 --- /dev/null +++ b/4b284b84b10c4py/evaluation/generation/examples.4b284b84b10c4py_gem_xsum_article_DOC_summary_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:80761393a7e7bf581d2fed59b536f0b46a872f7ef03df431ee5c0db2426b1f05 +size 4986747 diff --git a/4b284b84b10c4py/evaluation/generation/examples.4b284b84b10c4py_gem_xsum_article_DOC_summary_2.jsonl b/4b284b84b10c4py/evaluation/generation/examples.4b284b84b10c4py_gem_xsum_article_DOC_summary_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..853cd17bba626e909f0543799b74b577a48271fd --- /dev/null +++ b/4b284b84b10c4py/evaluation/generation/examples.4b284b84b10c4py_gem_xsum_article_DOC_summary_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0730f8d61dee7432f6b7f1c07afa18b3219aa514e36b55781ef8c4e4c891e359 +size 7238972 diff --git a/4b284b84b10c4py/evaluation/generation/examples.4b284b84b10c4py_gem_xsum_article_DOC_summary_3.jsonl b/4b284b84b10c4py/evaluation/generation/examples.4b284b84b10c4py_gem_xsum_article_DOC_summary_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..f188076e1735f4611a1bf90eb4f3c0cfe26a92c9 --- /dev/null +++ b/4b284b84b10c4py/evaluation/generation/examples.4b284b84b10c4py_gem_xsum_article_DOC_summary_3.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2832eeadaf5662418a4be49387dcc97e978d7f083048c29c963312d04f7ba442 +size 9510864 diff --git a/4b284b84b10c4py/evaluation/generation/examples.4b284b84b10c4py_gem_xsum_article_DOC_summary_4.jsonl b/4b284b84b10c4py/evaluation/generation/examples.4b284b84b10c4py_gem_xsum_article_DOC_summary_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..891db619075712274059c982aa901db668b84924 --- /dev/null +++ b/4b284b84b10c4py/evaluation/generation/examples.4b284b84b10c4py_gem_xsum_article_DOC_summary_4.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:74758f92d93b7685328f90ae4896e456c90eaaf8a1ab7947dcde44108623dcbf +size 11638928 diff --git a/4b284b84b10c4py/evaluation/generation/examples.4b284b84b10c4py_gem_xsum_article_DOC_summary_5.jsonl b/4b284b84b10c4py/evaluation/generation/examples.4b284b84b10c4py_gem_xsum_article_DOC_summary_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..0a9cb9aa64b59983d15acc1c84ebd548ab100bb5 --- /dev/null +++ b/4b284b84b10c4py/evaluation/generation/examples.4b284b84b10c4py_gem_xsum_article_DOC_summary_5.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bb168ef86f4fd069f59d0360f8d8bf0c0819909232833072bca85bba0b54882e +size 13897455 diff --git a/4b284b84b10c4py/evaluation/generation/slim.4b284b84b10c4py_GEM-web_nlg_en_PALM_prompt_0.json b/4b284b84b10c4py/evaluation/generation/slim.4b284b84b10c4py_GEM-web_nlg_en_PALM_prompt_0.json new file mode 100644 index 0000000000000000000000000000000000000000..abfd6783e65d7777a829d0d26601a79b96832e59 --- /dev/null +++ b/4b284b84b10c4py/evaluation/generation/slim.4b284b84b10c4py_GEM-web_nlg_en_PALM_prompt_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.4813014742136315, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.029298284790512823 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.07814637483776633, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0013388565211954557 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.39367165732976755, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0052609219673642686 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.12355058601433035, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.001894994722809818 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.03357663912471221, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0007824220781305639 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.18024451705008498, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0037047453236374803 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.05343668682534253, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0011505936382800977 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.07298923635178714, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0011896452042006365 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.3727466061438325, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.005005690787063604 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.11573328163228513, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0017001940430562083 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.07168838309172086, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0012342784180538735 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.3612267886931813, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004790388470075587 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.11322320217099578, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0017394583047356308 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4py/4b284b84b10c4py/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84b10c4py/evaluation/generation/slim.4b284b84b10c4py_GEM-web_nlg_en_PALM_prompt_1.json b/4b284b84b10c4py/evaluation/generation/slim.4b284b84b10c4py_GEM-web_nlg_en_PALM_prompt_1.json new file mode 100644 index 0000000000000000000000000000000000000000..fc8f8f470c088cbf25d58e3906297004c6279475 --- /dev/null +++ b/4b284b84b10c4py/evaluation/generation/slim.4b284b84b10c4py_GEM-web_nlg_en_PALM_prompt_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.7255238696408423, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.053879561708253726 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.1625223257514928, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.005111682257014667 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.32599686697536673, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.005056163504321368 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.17553593173895937, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.004096195356643218 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.08437320166589189, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.003472257493578088 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.17009103545543425, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0036595655247239614 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.08995358919930085, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.00276677511793771 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.1443002602162733, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.004479274553715264 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.3023393609518485, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004598931367210058 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.1575106385009677, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0035058149961314554 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.14870447627323272, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.00462570655861519 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.3067494379024135, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004650958784315044 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.1613119682169033, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0036048812212870155 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4py/4b284b84b10c4py/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84b10c4py/evaluation/generation/slim.4b284b84b10c4py_GEM-web_nlg_en_PALM_prompt_2.json b/4b284b84b10c4py/evaluation/generation/slim.4b284b84b10c4py_GEM-web_nlg_en_PALM_prompt_2.json new file mode 100644 index 0000000000000000000000000000000000000000..c49aff9a19e85c3471d8341c5f765c88cdd73b31 --- /dev/null +++ b/4b284b84b10c4py/evaluation/generation/slim.4b284b84b10c4py_GEM-web_nlg_en_PALM_prompt_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.8687128586366801, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.04673010602404015 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.1701554452582214, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.005107771330279079 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.355832019011606, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.004884775439773983 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.19129452100187833, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.004216273048303227 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.09088743631977127, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.003444014418662031 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.18939437656895264, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0037355969446100823 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.10058078270140805, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0029257899877312156 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.14879189467464685, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0043534563737425485 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.32802790773843415, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004479264764219749 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.1700727632598896, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.003579698843822934 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.1549450062748448, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.004557766264854074 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.334886885021682, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004545614262741492 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.17593789645790273, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0037452392698808686 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4py/4b284b84b10c4py/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84b10c4py/evaluation/generation/slim.4b284b84b10c4py_GEM-web_nlg_en_PALM_prompt_3.json b/4b284b84b10c4py/evaluation/generation/slim.4b284b84b10c4py_GEM-web_nlg_en_PALM_prompt_3.json new file mode 100644 index 0000000000000000000000000000000000000000..959c184d5008d12c0160560137c1d16d75bb1769 --- /dev/null +++ b/4b284b84b10c4py/evaluation/generation/slim.4b284b84b10c4py_GEM-web_nlg_en_PALM_prompt_3.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.976110601716665, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.05147232952331574 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.17650374199610544, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.005278588530178822 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.3620490484768146, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.004763724984545098 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.1955261278048012, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0042687987276028025 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.09649007165425032, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.003579903171459426 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.1932492774677527, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0036237451702642704 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.10373196315248306, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.002909773730879196 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.15353988316234024, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.004424257414579797 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.3329632854608314, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004284658072005821 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.1729686164923851, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.003539784845210468 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.1606790115172626, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.004723404323298352 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.33915285374439175, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004340341067923443 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.17904838371148374, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.003744462902264531 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4py/4b284b84b10c4py/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 3, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84b10c4py/evaluation/generation/slim.4b284b84b10c4py_GEM-web_nlg_en_PALM_prompt_4.json b/4b284b84b10c4py/evaluation/generation/slim.4b284b84b10c4py_GEM-web_nlg_en_PALM_prompt_4.json new file mode 100644 index 0000000000000000000000000000000000000000..9dd7dc0b226133d6e5d23fb7e12cb1a3c325ef98 --- /dev/null +++ b/4b284b84b10c4py/evaluation/generation/slim.4b284b84b10c4py_GEM-web_nlg_en_PALM_prompt_4.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 1.0350167319929164, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.08089511258341531 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.18224379597295554, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0054869315349140284 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.3728518882868007, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.004805363061413696 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.20005984608564545, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0043621938032114985 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.10200985474477063, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0037380638769571885 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.20291177783621683, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.003801448242387614 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.10839195425794168, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0030187532546412294 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.15805723338022432, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.004637765426393908 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.341594924355393, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004322861765243894 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.17627371459053626, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0036366682681705747 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.16598914017637473, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.004915957758353431 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.35013405773908396, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0044261493721537235 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.18370609844319763, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.003859835340459462 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4py/4b284b84b10c4py/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 4, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84b10c4py/evaluation/generation/slim.4b284b84b10c4py_GEM-web_nlg_en_PALM_prompt_5.json b/4b284b84b10c4py/evaluation/generation/slim.4b284b84b10c4py_GEM-web_nlg_en_PALM_prompt_5.json new file mode 100644 index 0000000000000000000000000000000000000000..b17fbecd828f58b5fd92878718443d678cc62bb3 --- /dev/null +++ b/4b284b84b10c4py/evaluation/generation/slim.4b284b84b10c4py_GEM-web_nlg_en_PALM_prompt_5.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 1.099500805669065, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.05128274555498221 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.18895154801724418, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.005525818321828389 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.38248844776913693, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.004934647163878857 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.21085477597688443, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.004537288839362036 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.10447278232108755, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.003746341946804797 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.2070479482405224, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.003822643707608457 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.11341187327748274, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0031174298961979667 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.16301359107525903, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.004631366227638678 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.3486223306539461, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0043860650726248295 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.18499664526019835, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0037604793276689013 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.1713978535792387, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.00494124825637956 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.3573153383883979, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004488735837365747 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.19265091926675612, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.003995741079720777 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4py/4b284b84b10c4py/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 5, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84b10c4py/evaluation/generation/slim.4b284b84b10c4py_GEM-wiki_lingua_en_tldr_en_0.json b/4b284b84b10c4py/evaluation/generation/slim.4b284b84b10c4py_GEM-wiki_lingua_en_tldr_en_0.json new file mode 100644 index 0000000000000000000000000000000000000000..a1e06c60cfbb5545c0285d1f67ca44e23cfa8be1 --- /dev/null +++ b/4b284b84b10c4py/evaluation/generation/slim.4b284b84b10c4py_GEM-wiki_lingua_en_tldr_en_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.1824848450703605, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.002258769733514356 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.2829504579856686, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.002892378725128921 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.20438865109293125, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0020542271239135474 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.043109912585657335, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0009711440225665886 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.06736443489887266, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0015632414031077888 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.048105932388098856, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0010139576129839956 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.13644080096663336, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0015842215640080625 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.21853544620158255, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0022785408725319403 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.15441829967250942, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0014514089251988502 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.16955964056676814, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.002110604546495203 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.2633994155788588, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0027106937173640546 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.18999551527620429, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0019185335839288905 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 2.439034811249811, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.08814349202270069 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4py/4b284b84b10c4py/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84b10c4py/evaluation/generation/slim.4b284b84b10c4py_GEM-wiki_lingua_en_tldr_en_1.json b/4b284b84b10c4py/evaluation/generation/slim.4b284b84b10c4py_GEM-wiki_lingua_en_tldr_en_1.json new file mode 100644 index 0000000000000000000000000000000000000000..da77622b64eae6aa64a6bb462aac2031bbeb778e --- /dev/null +++ b/4b284b84b10c4py/evaluation/generation/slim.4b284b84b10c4py_GEM-wiki_lingua_en_tldr_en_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.27650295097853705, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.00433037610306865 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.20123333179446745, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0029592287408768563 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.1817945339591683, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0021379348675478974 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.07927146370780327, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0028993886109516787 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.048713843049408144, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0014696170848375373 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.04414011089261056, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0011864515717073022 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.22325969773232404, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0038282019630928436 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.15381843600559833, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0022441425803852682 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.14036723611181662, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.001621088879287515 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.2620080990727989, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0041842438687289705 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.18922669116358481, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0027816420778518647 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.17107746115835645, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.002004425675535598 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 2.592511832648172, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.0883522873390386 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4py/4b284b84b10c4py/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84b10c4py/evaluation/generation/slim.4b284b84b10c4py_GEM-wiki_lingua_en_tldr_en_2.json b/4b284b84b10c4py/evaluation/generation/slim.4b284b84b10c4py_GEM-wiki_lingua_en_tldr_en_2.json new file mode 100644 index 0000000000000000000000000000000000000000..4a59de33c2462add33f791dc9a9da9aedbc0fac7 --- /dev/null +++ b/4b284b84b10c4py/evaluation/generation/slim.4b284b84b10c4py_GEM-wiki_lingua_en_tldr_en_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.33293478487683886, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.004638481088709241 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.20832991559189593, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.002882384230492161 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.201455981397101, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.002215864605685192 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.10981600440845445, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0032662143067739334 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.0571749108797057, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0014697451697197228 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.056871066430790325, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.001341215790213451 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.2702435488101451, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.004129606571484203 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.1613125746864521, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0022067815922600644 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.1572901498332904, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.001727626060232697 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.31764168504184737, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.004542434958936431 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.19654070699277223, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0027147097304651784 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.1904207426584212, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0020985538580578374 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 3.1897316776859443, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.10383641450422736 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4py/4b284b84b10c4py/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84b10c4py/evaluation/generation/slim.4b284b84b10c4py_GEM-wiki_lingua_en_tldr_en_3.json b/4b284b84b10c4py/evaluation/generation/slim.4b284b84b10c4py_GEM-wiki_lingua_en_tldr_en_3.json new file mode 100644 index 0000000000000000000000000000000000000000..9c2cea92a0981e2db47d2d4426f8b7bdd74b2540 --- /dev/null +++ b/4b284b84b10c4py/evaluation/generation/slim.4b284b84b10c4py_GEM-wiki_lingua_en_tldr_en_3.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.2993896407068062, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.004961826525869491 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.17036445945014525, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0030340761083348573 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.17011994598152969, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0024811944029056563 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.10010009650819313, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0032857461552203595 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.04756100531684024, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0014329928419246308 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.04854258938628169, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0013429745795374734 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.2477387853206388, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.004400377182402362 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.13297516874095594, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0023567485440671196 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.13474954073077003, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.001970359077922383 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.28541851433610155, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.004807244705293582 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.16068089265916596, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0028651117671434395 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.16095317824352906, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0023610481534614897 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 2.1373295852103618, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.09657133458196947 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4py/4b284b84b10c4py/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 3, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84b10c4py/evaluation/generation/slim.4b284b84b10c4py_GEM-wiki_lingua_en_tldr_en_4.json b/4b284b84b10c4py/evaluation/generation/slim.4b284b84b10c4py_GEM-wiki_lingua_en_tldr_en_4.json new file mode 100644 index 0000000000000000000000000000000000000000..e088489323cf5693daa508c290810083f23944ac --- /dev/null +++ b/4b284b84b10c4py/evaluation/generation/slim.4b284b84b10c4py_GEM-wiki_lingua_en_tldr_en_4.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.10233602202490566, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.003901148966833399 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.05690170219061377, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.002261392037062523 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.05785530003387149, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.002104739102006248 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.032881948765465734, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.00214275596785197 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.015513277487513246, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0009900569977354416 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.016216361695071208, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0009795250112890484 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.0857146344396996, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.003416320759360737 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.0445264515835226, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0017587334889400765 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.046183940516235616, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0016983322564463742 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.0972394371974616, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.003756250172857945 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.05298521225905992, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0021031803096113336 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.054222605768747344, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.001979311930128123 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 0.03779045940266729, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.00499486813251369 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4py/4b284b84b10c4py/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 4, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84b10c4py/evaluation/generation/slim.4b284b84b10c4py_GEM-wiki_lingua_en_tldr_en_5.json b/4b284b84b10c4py/evaluation/generation/slim.4b284b84b10c4py_GEM-wiki_lingua_en_tldr_en_5.json new file mode 100644 index 0000000000000000000000000000000000000000..99af4740e740f9e0d62beaa2e8c9af2b9671e2bc --- /dev/null +++ b/4b284b84b10c4py/evaluation/generation/slim.4b284b84b10c4py_GEM-wiki_lingua_en_tldr_en_5.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.01666321917537446, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0017144844493535089 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.009157687542181802, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0009736218557175297 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.00927977866130263, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0009046636518910162 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.005635566478053115, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0009678519939045886 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.002607955654242479, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0004157349477803617 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.0027628200691328687, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.00040474421977877023 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.014505480826312199, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0015703654365691406 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.007377263181545838, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0007854353219556513 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.007640431942454017, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0007551641757705242 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.01613430616214765, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0016859400230554314 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.008638145878204216, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0009157832781292763 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.008819513768437372, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0008640055278148719 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 6.058866159905281e-16, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 2.3900117794994548e-15 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4py/4b284b84b10c4py/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 5, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84b10c4py/evaluation/generation/slim.4b284b84b10c4py_e2e_nlg_cleaned_generate_text_restaurant_0.json b/4b284b84b10c4py/evaluation/generation/slim.4b284b84b10c4py_e2e_nlg_cleaned_generate_text_restaurant_0.json new file mode 100644 index 0000000000000000000000000000000000000000..418b02b8d8aacf5b189186b31278273886dc7e47 --- /dev/null +++ b/4b284b84b10c4py/evaluation/generation/slim.4b284b84b10c4py_e2e_nlg_cleaned_generate_text_restaurant_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 2.021544193176019, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.04672525631492646 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.3452949497006971, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.0031874336438570136 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.3412418289576795, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.0034398228533816144 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.33225583490736194, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.0030225097754752873 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.11855573943397561, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0015761697052151904 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.12140620974140548, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.0018263607260067699 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.11599617848462068, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0015886302807693743 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.24616297725036965, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.0022797007734971847 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.24639726684479762, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.0025797032547250176 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.2383281424265221, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.002215264906335406 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.3190175340171995, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.002958732504531792 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.31764816538422297, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.0033043767478234854 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.3081149911342974, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0028594046078756815 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4py/4b284b84b10c4py/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84b10c4py/evaluation/generation/slim.4b284b84b10c4py_e2e_nlg_cleaned_generate_text_restaurant_1.json b/4b284b84b10c4py/evaluation/generation/slim.4b284b84b10c4py_e2e_nlg_cleaned_generate_text_restaurant_1.json new file mode 100644 index 0000000000000000000000000000000000000000..038537a8e3837f14c67d565f5f56d824b709b149 --- /dev/null +++ b/4b284b84b10c4py/evaluation/generation/slim.4b284b84b10c4py_e2e_nlg_cleaned_generate_text_restaurant_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 14.53743726129001, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.14445690934234265 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.6082899833637005, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.0032135327715503183 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.4939991587989527, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.0031897368344663206 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.5180906148683028, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.0024567692495659718 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.2992841860287957, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0027535069501413525 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.24073848287899435, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.0023692738232853716 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.25244576500518445, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0021987704228017047 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.4377558923516418, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.0030209364495319283 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.3522118606318514, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.0026145016755065214 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.3702354270220447, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.002229049797298906 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.49559037424824853, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.0031867294805906312 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.4017134750190358, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.002963390841940911 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.4215085599639745, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0024837056691902086 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4py/4b284b84b10c4py/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84b10c4py/evaluation/generation/slim.4b284b84b10c4py_e2e_nlg_cleaned_generate_text_restaurant_2.json b/4b284b84b10c4py/evaluation/generation/slim.4b284b84b10c4py_e2e_nlg_cleaned_generate_text_restaurant_2.json new file mode 100644 index 0000000000000000000000000000000000000000..192cdc88e72c3765ff619491f8e3850868f7ec2a --- /dev/null +++ b/4b284b84b10c4py/evaluation/generation/slim.4b284b84b10c4py_e2e_nlg_cleaned_generate_text_restaurant_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 16.6974233877375, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.2259702264159085 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.6308114156673001, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.0030515635455948056 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.5241737976358826, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.0029634534710997382 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.550751959150263, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.002334628388103356 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.3245854766100972, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.002738959218334304 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.26676548563429314, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.002350700363573182 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.28087700716585834, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.002229388349802515 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.4599329987100549, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.0029633837519416856 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.38012920627255303, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.002577942917596876 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.40000959435601263, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.002278833446615684 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.52202474439705, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.0031213147774664753 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.4336862446313041, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.002861587766898658 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.4557773932977128, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0024812907319972668 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4py/4b284b84b10c4py/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84b10c4py/evaluation/generation/slim.4b284b84b10c4py_e2e_nlg_cleaned_generate_text_restaurant_3.json b/4b284b84b10c4py/evaluation/generation/slim.4b284b84b10c4py_e2e_nlg_cleaned_generate_text_restaurant_3.json new file mode 100644 index 0000000000000000000000000000000000000000..c8999aa4ab3ce833690b408210f447637247ea73 --- /dev/null +++ b/4b284b84b10c4py/evaluation/generation/slim.4b284b84b10c4py_e2e_nlg_cleaned_generate_text_restaurant_3.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 17.234863759565464, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.10626094777357345 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.6451638771759513, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.0029145371412898314 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.5273596630229687, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.0028796397050091654 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.5604782743289571, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.0022490187814614418 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.337823399687939, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.002721131963155123 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.2741776446898378, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.002401017670924296 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.29137647462406413, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0022566745277518207 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.4713022566374456, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.002890868676128115 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.38393681062737384, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.0025637744220680424 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.40840245354897814, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.002267056969140555 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.5372731680476394, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.0030240854085328223 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.4392611204948281, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.0028130487549137095 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.4667947275839455, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.002424767456065824 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4py/4b284b84b10c4py/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 3, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84b10c4py/evaluation/generation/slim.4b284b84b10c4py_e2e_nlg_cleaned_generate_text_restaurant_4.json b/4b284b84b10c4py/evaluation/generation/slim.4b284b84b10c4py_e2e_nlg_cleaned_generate_text_restaurant_4.json new file mode 100644 index 0000000000000000000000000000000000000000..ffabcf93563dd6c3d429b65b6040139624ea9cf3 --- /dev/null +++ b/4b284b84b10c4py/evaluation/generation/slim.4b284b84b10c4py_e2e_nlg_cleaned_generate_text_restaurant_4.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 17.43221273186975, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.14852992258132883 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.6566667386405739, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.0029901104310675994 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.5250310784733211, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.002880579788531886 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.5644088431191606, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.0022998414866846426 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.3489715445596063, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0028379714911102717 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.2759061577612267, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.002418733555610404 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.29718267067971493, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0023174404504521418 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.48238946977859254, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.0030258886889425406 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.3841163890326242, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.0025948324351265347 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.413398262443025, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0023490992885206218 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.5493173554754809, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.0031195526839171693 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.43936018496359347, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.0028421410516723516 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.4722659980511927, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.002493574854840473 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4py/4b284b84b10c4py/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 4, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84b10c4py/evaluation/generation/slim.4b284b84b10c4py_e2e_nlg_cleaned_generate_text_restaurant_5.json b/4b284b84b10c4py/evaluation/generation/slim.4b284b84b10c4py_e2e_nlg_cleaned_generate_text_restaurant_5.json new file mode 100644 index 0000000000000000000000000000000000000000..61a38605a6f35dfd901aca8194fce50fcf216ac3 --- /dev/null +++ b/4b284b84b10c4py/evaluation/generation/slim.4b284b84b10c4py_e2e_nlg_cleaned_generate_text_restaurant_5.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 17.27987171682975, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.22299466307707344 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.6628915228196061, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.002895062323071317 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.5218597939831594, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.0027835407580159314 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.5661613833598578, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.0022266488649150696 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.3538900021766568, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.002806480832935743 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.27471917389658523, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.0023266477815265104 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.2990249691536151, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0022661493792424697 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.4881090745767031, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.0029641049977624664 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.3820604186528641, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.0024902085041821334 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.41542888953754, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.002290321145556158 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.5555907001865986, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.0030782994957697994 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.4369700778836929, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.002723697352083028 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.47431838670472687, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.002431375830473114 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4py/4b284b84b10c4py/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 5, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84b10c4py/evaluation/generation/slim.4b284b84b10c4py_gem_xsum_article_DOC_summary_0.json b/4b284b84b10c4py/evaluation/generation/slim.4b284b84b10c4py_gem_xsum_article_DOC_summary_0.json new file mode 100644 index 0000000000000000000000000000000000000000..1dec3770af9e19b3a8fae41ff379df273825ade6 --- /dev/null +++ b/4b284b84b10c4py/evaluation/generation/slim.4b284b84b10c4py_gem_xsum_article_DOC_summary_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.16091335382563132, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.0023214839725675105 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.31192453482745763, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.00431663840907332 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.20154310340791382, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.002503527086260468 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.030192336082604687, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0011298757941540884 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.06486203625582514, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.002495687484786392 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.03939889642394197, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0014269911312081135 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.11804593952699223, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.001705008234352379 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.23090498894651582, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.003262191317539296 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.14814803620232633, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0018194923690126705 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.12345041061371383, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0018404072547649245 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.24335540258442262, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.0037333681065596135 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.15559873712369335, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.002082741430413441 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 1.598333295912428, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.04369181828078937 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4py/4b284b84b10c4py/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84b10c4py/evaluation/generation/slim.4b284b84b10c4py_gem_xsum_article_DOC_summary_1.json b/4b284b84b10c4py/evaluation/generation/slim.4b284b84b10c4py_gem_xsum_article_DOC_summary_1.json new file mode 100644 index 0000000000000000000000000000000000000000..7e99d42da75fc6f1bbda457027b1314d51ddb47a --- /dev/null +++ b/4b284b84b10c4py/evaluation/generation/slim.4b284b84b10c4py_gem_xsum_article_DOC_summary_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.1740287506077371, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.0035762963549450144 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.23534981942590377, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.003659738471811391 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.18440937659488896, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.003013311852017229 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.03131736257651789, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0017657388713041011 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.03976502875447221, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.001888187751012635 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.03225325166687549, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0016333078188436293 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.13323315845033426, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0026925290035192807 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.18196243615159283, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.002782613837447707 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.14145239281725078, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0022406116825912387 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.13483891468420867, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0027354596616931065 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.18482502398325326, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.002947981471107514 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.14336629014297197, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0023103743217644922 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 1.3695546970670758, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.11288065979583667 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4py/4b284b84b10c4py/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84b10c4py/evaluation/generation/slim.4b284b84b10c4py_gem_xsum_article_DOC_summary_2.json b/4b284b84b10c4py/evaluation/generation/slim.4b284b84b10c4py_gem_xsum_article_DOC_summary_2.json new file mode 100644 index 0000000000000000000000000000000000000000..a351a63b07f3642d0977e0d04b03c3802355fa8b --- /dev/null +++ b/4b284b84b10c4py/evaluation/generation/slim.4b284b84b10c4py_gem_xsum_article_DOC_summary_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.19985236655576322, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.003978452096741706 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.243103956744537, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.0036939855243832025 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.20363897243347945, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.0032917079133891604 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.039138232698124914, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.002062532698520258 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.044204414475646464, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.002004713309978894 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.03868362872963243, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0018516242073862486 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.1506477774402608, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.003020476793401718 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.18469817921156023, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.0027972563470297306 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.15378100277488155, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0024750584853391777 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.15239590573770034, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0030467162920539536 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.18749040242023876, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.0029321410628762915 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.15570322493810856, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0025139232679603388 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 1.7308730289259378, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.17770532210337478 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4py/4b284b84b10c4py/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84b10c4py/evaluation/generation/slim.4b284b84b10c4py_gem_xsum_article_DOC_summary_3.json b/4b284b84b10c4py/evaluation/generation/slim.4b284b84b10c4py_gem_xsum_article_DOC_summary_3.json new file mode 100644 index 0000000000000000000000000000000000000000..bfd98878dac73e08308c0aaedd67a95c4134a96f --- /dev/null +++ b/4b284b84b10c4py/evaluation/generation/slim.4b284b84b10c4py_gem_xsum_article_DOC_summary_3.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.19589658794017453, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.0039853906513849366 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.22849167295097247, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.0038566308815145126 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.1953341147235192, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.003349630735723747 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.03625824703902077, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0018314388825531765 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.0410258003930899, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.0018846780449691557 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.035779638469116914, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0016750996803778595 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.148688151900945, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.003095918669053127 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.17399714292187934, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.0029506577213898122 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.1480464200642175, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0025456089591690385 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.1509875423818125, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.003109411289001428 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.17818678675083813, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.003105658861483215 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.150857629725387, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0025908796219687017 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 1.6177421822314764, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.16975721226529852 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4py/4b284b84b10c4py/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 3, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84b10c4py/evaluation/generation/slim.4b284b84b10c4py_gem_xsum_article_DOC_summary_4.json b/4b284b84b10c4py/evaluation/generation/slim.4b284b84b10c4py_gem_xsum_article_DOC_summary_4.json new file mode 100644 index 0000000000000000000000000000000000000000..b379cb4ba5264fc7a6852c6f42f4430f2d5526c9 --- /dev/null +++ b/4b284b84b10c4py/evaluation/generation/slim.4b284b84b10c4py_gem_xsum_article_DOC_summary_4.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.06152754510214762, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.003813964694018243 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.060593832681025625, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.0035841876676039335 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.055186415576932185, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.0031944085309462042 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.011572977582773758, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0012872321658089607 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.01149657270593299, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.0011931029906206063 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.010566772575448751, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0010986586323403539 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.046781635255582606, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.00298661745817834 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.04475132182365535, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.0026420061653404576 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.041175984283283985, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0024057569727709742 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.04812651646509195, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0030363159363846065 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.04684919680777955, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.0027817704867131674 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.04268034684571005, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.002476327367349351 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 0.21556427831831304, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.05992392947727259 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4py/4b284b84b10c4py/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 4, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84b10c4py/evaluation/generation/slim.4b284b84b10c4py_gem_xsum_article_DOC_summary_5.json b/4b284b84b10c4py/evaluation/generation/slim.4b284b84b10c4py_gem_xsum_article_DOC_summary_5.json new file mode 100644 index 0000000000000000000000000000000000000000..23b875b6c49e5d54a64fd0e852ed0dbff3ecdb68 --- /dev/null +++ b/4b284b84b10c4py/evaluation/generation/slim.4b284b84b10c4py_gem_xsum_article_DOC_summary_5.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.0031162728399716532, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.0008737460454355458 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.002628521163198049, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.0007303851868588104 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.0027771927477267732, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.0007722613879690155 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.000451588582831646, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.00021783265095521171 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.00036940260996864765, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.00019380741759243087 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.0004013828039517138, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.00020138596141432264 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.0023063072540261626, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.000636589500329542 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.001989261212241742, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.0005658258080821268 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.002068253073845221, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0005744934556807894 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.0025476363697054154, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0007118711755257363 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.0021837068783855215, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.0006187556981975251 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.00228235191573137, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0006382890720853227 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 1.1959919832512981e-41, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 4.418229601032825e-38 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4py/4b284b84b10c4py/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 5, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b84b10c4py/evaluation/rankeval/4b284b84b10c4py_0.json b/4b284b84b10c4py/evaluation/rankeval/4b284b84b10c4py_0.json new file mode 100644 index 0000000000000000000000000000000000000000..ac01b4b682a557098f22ac97fe67c6d7541802da --- /dev/null +++ b/4b284b84b10c4py/evaluation/rankeval/4b284b84b10c4py_0.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.333, + "acc_stderr": 0.014910846164229868 + }, + "anli_r2": { + "acc": 0.338, + "acc_stderr": 0.014965960710224482 + }, + "anli_r3": { + "acc": 0.3458333333333333, + "acc_stderr": 0.013736245342311012 + }, + "cb": { + "acc": 0.35714285714285715, + "acc_stderr": 0.0646095738380922, + "f1": 0.19814814814814818 + }, + "copa": { + "acc": 0.68, + "acc_stderr": 0.046882617226215034 + }, + "hellaswag": { + "acc": 0.3619796853216491, + "acc_stderr": 0.00479590828258455, + "acc_norm": 0.44632543318064133, + "acc_norm_stderr": 0.0049609473885351 + }, + "rte": { + "acc": 0.5270758122743683, + "acc_stderr": 0.030052303463143706 + }, + "winogrande": { + "acc": 0.5201262825572218, + "acc_stderr": 0.014041096664344327 + }, + "storycloze_2016": { + "acc": 0.6504543025120256, + "acc_stderr": 0.01102654800403797 + }, + "boolq": { + "acc": 0.6048929663608563, + "acc_stderr": 0.008550454248280895 + }, + "arc_easy": { + "acc": 0.5294612794612794, + "acc_stderr": 0.010241957728409686, + "acc_norm": 0.45202020202020204, + "acc_norm_stderr": 0.010212436978834111 + }, + "arc_challenge": { + "acc": 0.21416382252559726, + "acc_stderr": 0.011988383205966499, + "acc_norm": 0.25597269624573377, + "acc_norm_stderr": 0.012753013241244513 + }, + "sciq": { + "acc": 0.821, + "acc_stderr": 0.012128730605719111, + "acc_norm": 0.711, + "acc_norm_stderr": 0.01434171135829618 + }, + "piqa": { + "acc": 0.6980413492927094, + "acc_stderr": 0.01071173289158835, + "acc_norm": 0.7040261153427638, + "acc_norm_stderr": 0.010650414317148128 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b84b10c4py/evaluation/rankeval/4b284b84b10c4py_1.json b/4b284b84b10c4py/evaluation/rankeval/4b284b84b10c4py_1.json new file mode 100644 index 0000000000000000000000000000000000000000..913d6cfe5dc509473dd995a0390acf27a80ebf89 --- /dev/null +++ b/4b284b84b10c4py/evaluation/rankeval/4b284b84b10c4py_1.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.316, + "acc_stderr": 0.014709193056057121 + }, + "anli_r2": { + "acc": 0.324, + "acc_stderr": 0.014806864733738856 + }, + "anli_r3": { + "acc": 0.3358333333333333, + "acc_stderr": 0.013639261190932887 + }, + "cb": { + "acc": 0.48214285714285715, + "acc_stderr": 0.06737697508644648, + "f1": 0.3373075012419274 + }, + "copa": { + "acc": 0.75, + "acc_stderr": 0.04351941398892446 + }, + "hellaswag": { + "acc": 0.3617805218084047, + "acc_stderr": 0.004795337009118191, + "acc_norm": 0.44234216291575384, + "acc_norm_stderr": 0.0049564940598648966 + }, + "rte": { + "acc": 0.5306859205776173, + "acc_stderr": 0.03003973059219781 + }, + "winogrande": { + "acc": 0.5169692186266772, + "acc_stderr": 0.014044390401612978 + }, + "storycloze_2016": { + "acc": 0.6221272047033671, + "acc_stderr": 0.01121221988713706 + }, + "boolq": { + "acc": 0.55565749235474, + "acc_stderr": 0.00869070599067338 + }, + "arc_easy": { + "acc": 0.5429292929292929, + "acc_stderr": 0.010221897564256052, + "acc_norm": 0.5096801346801347, + "acc_norm_stderr": 0.010257860554461127 + }, + "arc_challenge": { + "acc": 0.22440273037542663, + "acc_stderr": 0.012191404938603843, + "acc_norm": 0.2568259385665529, + "acc_norm_stderr": 0.0127669237941168 + }, + "sciq": { + "acc": 0.885, + "acc_stderr": 0.010093407594904628, + "acc_norm": 0.853, + "acc_norm_stderr": 0.011203415395160336 + }, + "piqa": { + "acc": 0.6980413492927094, + "acc_stderr": 0.010711732891588357, + "acc_norm": 0.691512513601741, + "acc_norm_stderr": 0.010776164678037155 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b84b10c4py/evaluation/rankeval/4b284b84b10c4py_2.json b/4b284b84b10c4py/evaluation/rankeval/4b284b84b10c4py_2.json new file mode 100644 index 0000000000000000000000000000000000000000..05f192ee575fd9f8511bb8804f93b2113548e1dc --- /dev/null +++ b/4b284b84b10c4py/evaluation/rankeval/4b284b84b10c4py_2.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.332, + "acc_stderr": 0.014899597242811473 + }, + "anli_r2": { + "acc": 0.332, + "acc_stderr": 0.01489959724281148 + }, + "anli_r3": { + "acc": 0.3258333333333333, + "acc_stderr": 0.013535422043417462 + }, + "cb": { + "acc": 0.48214285714285715, + "acc_stderr": 0.0673769750864465, + "f1": 0.3268398268398269 + }, + "copa": { + "acc": 0.64, + "acc_stderr": 0.04824181513244218 + }, + "hellaswag": { + "acc": 0.3599880501892053, + "acc_stderr": 0.004790155370993451, + "acc_norm": 0.44911372236606256, + "acc_norm_stderr": 0.004963872936857939 + }, + "rte": { + "acc": 0.5126353790613718, + "acc_stderr": 0.030086851767188564 + }, + "winogrande": { + "acc": 0.5240726124704025, + "acc_stderr": 0.014036189665395134 + }, + "storycloze_2016": { + "acc": 0.6264029930518439, + "acc_stderr": 0.011186849693644696 + }, + "boolq": { + "acc": 0.5559633027522936, + "acc_stderr": 0.00869010521492079 + }, + "arc_easy": { + "acc": 0.5429292929292929, + "acc_stderr": 0.01022189756425605, + "acc_norm": 0.5315656565656566, + "acc_norm_stderr": 0.010239317603199512 + }, + "arc_challenge": { + "acc": 0.2167235494880546, + "acc_stderr": 0.012040156713481189, + "acc_norm": 0.2593856655290102, + "acc_norm_stderr": 0.012808273573927097 + }, + "sciq": { + "acc": 0.881, + "acc_stderr": 0.010244215145336662, + "acc_norm": 0.877, + "acc_norm_stderr": 0.010391293421849879 + }, + "piqa": { + "acc": 0.6985854189336235, + "acc_stderr": 0.01070624824275376, + "acc_norm": 0.6969532100108814, + "acc_norm_stderr": 0.010722648689531501 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b84b10c4py/evaluation/rankeval/4b284b84b10c4py_3.json b/4b284b84b10c4py/evaluation/rankeval/4b284b84b10c4py_3.json new file mode 100644 index 0000000000000000000000000000000000000000..fc8692298193b7f213939b60f0453da541b4650d --- /dev/null +++ b/4b284b84b10c4py/evaluation/rankeval/4b284b84b10c4py_3.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.29, + "acc_stderr": 0.014356395999905689 + }, + "anli_r2": { + "acc": 0.365, + "acc_stderr": 0.015231776226264903 + }, + "anli_r3": { + "acc": 0.3333333333333333, + "acc_stderr": 0.013613950010225603 + }, + "cb": { + "acc": 0.6071428571428571, + "acc_stderr": 0.0658538889806635, + "f1": 0.4062342885872297 + }, + "copa": { + "acc": 0.73, + "acc_stderr": 0.044619604333847394 + }, + "hellaswag": { + "acc": 0.36168094005178253, + "acc_stderr": 0.004795051037917719, + "acc_norm": 0.45210117506472813, + "acc_norm_stderr": 0.004966832553245038 + }, + "rte": { + "acc": 0.5379061371841155, + "acc_stderr": 0.030009848912529117 + }, + "winogrande": { + "acc": 0.5122336227308603, + "acc_stderr": 0.01404827882040562 + }, + "storycloze_2016": { + "acc": 0.6344200962052379, + "acc_stderr": 0.011136758947688388 + }, + "boolq": { + "acc": 0.5663608562691131, + "acc_stderr": 0.008667690464344683 + }, + "arc_easy": { + "acc": 0.5370370370370371, + "acc_stderr": 0.010231597249131051, + "acc_norm": 0.5172558922558923, + "acc_norm_stderr": 0.010253671674754631 + }, + "arc_challenge": { + "acc": 0.21843003412969283, + "acc_stderr": 0.01207429160570098, + "acc_norm": 0.25597269624573377, + "acc_norm_stderr": 0.012753013241244518 + }, + "sciq": { + "acc": 0.889, + "acc_stderr": 0.009938701010583726, + "acc_norm": 0.875, + "acc_norm_stderr": 0.010463483381956722 + }, + "piqa": { + "acc": 0.704570184983678, + "acc_stderr": 0.010644731559342464, + "acc_norm": 0.705658324265506, + "acc_norm_stderr": 0.010633311470347519 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b84b10c4py/evaluation/rankeval/4b284b84b10c4py_4.json b/4b284b84b10c4py/evaluation/rankeval/4b284b84b10c4py_4.json new file mode 100644 index 0000000000000000000000000000000000000000..de51aa089c894b013f4c6f636c7fb6ff0e8dbf21 --- /dev/null +++ b/4b284b84b10c4py/evaluation/rankeval/4b284b84b10c4py_4.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.329, + "acc_stderr": 0.014865395385928364 + }, + "anli_r2": { + "acc": 0.338, + "acc_stderr": 0.014965960710224487 + }, + "anli_r3": { + "acc": 0.3325, + "acc_stderr": 0.013605417345710528 + }, + "cb": { + "acc": 0.5535714285714286, + "acc_stderr": 0.06703189227942395, + "f1": 0.3502252252252252 + }, + "copa": { + "acc": 0.68, + "acc_stderr": 0.04688261722621505 + }, + "hellaswag": { + "acc": 0.3595897231627166, + "acc_stderr": 0.004788994060654276, + "acc_norm": 0.44911372236606256, + "acc_norm_stderr": 0.004963872936857938 + }, + "rte": { + "acc": 0.4657039711191336, + "acc_stderr": 0.030025579819366426 + }, + "winogrande": { + "acc": 0.5224940805051302, + "acc_stderr": 0.014038257824059876 + }, + "storycloze_2016": { + "acc": 0.6365579903794762, + "acc_stderr": 0.011122841442059708 + }, + "boolq": { + "acc": 0.5577981651376147, + "acc_stderr": 0.00868643052611449 + }, + "arc_easy": { + "acc": 0.5433501683501684, + "acc_stderr": 0.010221149650118182, + "acc_norm": 0.523989898989899, + "acc_norm_stderr": 0.010247967392742688 + }, + "arc_challenge": { + "acc": 0.22525597269624573, + "acc_stderr": 0.012207839995407309, + "acc_norm": 0.25853242320819114, + "acc_norm_stderr": 0.012794553754288673 + }, + "sciq": { + "acc": 0.895, + "acc_stderr": 0.009698921026024968, + "acc_norm": 0.898, + "acc_norm_stderr": 0.00957536880165389 + }, + "piqa": { + "acc": 0.7083786724700761, + "acc_stderr": 0.01060444152742879, + "acc_norm": 0.7007616974972797, + "acc_norm_stderr": 0.010684130673134581 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b84b10c4py/evaluation/rankeval/4b284b84b10c4py_5.json b/4b284b84b10c4py/evaluation/rankeval/4b284b84b10c4py_5.json new file mode 100644 index 0000000000000000000000000000000000000000..61b3c11998751a7cd192722685f9dfc681c86f7e --- /dev/null +++ b/4b284b84b10c4py/evaluation/rankeval/4b284b84b10c4py_5.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.337, + "acc_stderr": 0.014955087918653607 + }, + "anli_r2": { + "acc": 0.337, + "acc_stderr": 0.014955087918653605 + }, + "anli_r3": { + "acc": 0.335, + "acc_stderr": 0.013630871843821474 + }, + "cb": { + "acc": 0.5892857142857143, + "acc_stderr": 0.06633634150359538, + "f1": 0.365874363327674 + }, + "copa": { + "acc": 0.71, + "acc_stderr": 0.04560480215720684 + }, + "hellaswag": { + "acc": 0.36217884883489343, + "acc_stderr": 0.004796478664403837, + "acc_norm": 0.4455287791276638, + "acc_norm_stderr": 0.0049600825288524325 + }, + "rte": { + "acc": 0.5667870036101083, + "acc_stderr": 0.029826764082138267 + }, + "winogrande": { + "acc": 0.510655090765588, + "acc_stderr": 0.0140492945362904 + }, + "storycloze_2016": { + "acc": 0.6419027258150721, + "acc_stderr": 0.011087006809925708 + }, + "boolq": { + "acc": 0.5657492354740061, + "acc_stderr": 0.008669116184243044 + }, + "arc_easy": { + "acc": 0.5454545454545454, + "acc_stderr": 0.010217299762709419, + "acc_norm": 0.5374579124579124, + "acc_norm_stderr": 0.010230952104570801 + }, + "arc_challenge": { + "acc": 0.23122866894197952, + "acc_stderr": 0.012320858834772273, + "acc_norm": 0.2636518771331058, + "acc_norm_stderr": 0.012875929151297065 + }, + "sciq": { + "acc": 0.9, + "acc_stderr": 0.009491579957525057, + "acc_norm": 0.892, + "acc_norm_stderr": 0.009820001651345694 + }, + "piqa": { + "acc": 0.705114254624592, + "acc_stderr": 0.010639030620156998, + "acc_norm": 0.6974972796517954, + "acc_norm_stderr": 0.010717199698083898 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7d9a9cbaae99f61db2942eb07f23476c1dbd6cc3 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7870a88a02d32c626d22e002c76b02983614c74381ca6a1c08d731af82c100db +size 199058647 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_0_mp_rank_01_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_0_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9717a380433ae4facf4d3ff4c68288267a38756b --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_0_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2a65af58a1c2140d653c6342477183dee94c741b55e6d504ea743646b87cb448 +size 199058647 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..84b2bc2d0fd1da0932fcc3b18270308e8ab6dfa9 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e0693da37c402315a8f79233d2a3aa38b0a045b974fde48e7a521fed4036d360 +size 199058733 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_100_mp_rank_01_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_100_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a4e3094266118d2b6c39fb30e3897d1a82f6f768 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_100_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:652dcffd412cda26ed4281e0d4c8b9a35b4f3dbc82cf14b558b75c380a0c6956 +size 199058733 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..65f78c612802bca3354737ed635238c909c487c1 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e09d009ae8fdb09dff81ff896d3235aad93cdff1c8a7c6a0fcbe6db52368d91c +size 199058797 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_101_mp_rank_01_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_101_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..327dab851aafa90dcab5cfd686872d6570589749 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_101_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3cdd9b58ec2b1f04569a72c3b86f4cf768d893d9c5b34c8a16c41c52fe709f68 +size 199058797 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f93dd3773f9c8002751097062105c2e99ba54d84 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6f0bb6fd212a09e2532ae195837dd8d10351115dca5c4db512da047573506d27 +size 199058733 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_102_mp_rank_01_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_102_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dbced79bf27b9d9813f9cde24d890e6fb6ae0f4b --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_102_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5d35ca0a495e2b26de1f0e9c83da6ae6e3bd8964a56752ec3e51c0d3cda83195 +size 199058733 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b782b0678f2da78ee5738d806271999ec2b524ab --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca0919d2fa306a59a07f669d1e065e8cfc8d94ed1028b2f21d51e4189ec6c1df +size 199058733 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_103_mp_rank_01_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_103_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4a4434a5b5664b99341bf1e2771080b1e893ef5d --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_103_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a18a540d31da33ca7dbbb93d674b410db792feacc2ae89965e8bc88fa1277aef +size 199058733 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..da5f465bd666f8622a45ba9f3cad627f52ff457f --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7f2d30d7cd7249af82078ecac83f1b9e94ec2c2d4d7e90bd5aafa6b41889c7cd +size 199058797 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_104_mp_rank_01_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_104_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..69c7f1152c10007c6f58d0b02bbaaccacb0179a4 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_104_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6d59654d5b2ac475c5e3553f26c7db991d5d16b12b565520f77491f922f2a705 +size 199058797 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9627353a98635b3c52951c273eaf3277158a7c69 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e789b52911c330cf3839c4e1df43c8d66d7951ce564a5c5cba778bed42aa8a8 +size 199058733 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_105_mp_rank_01_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_105_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2303e91c525f5c2035ca62e92f610afdada0ab9d --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_105_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d5514e422627373cea5fdddcc9b2aa501962781e2c647b509fd1dba0b103d9a +size 199058733 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2d5a2926a9545969e0900da5fa653e8fe7301c4f --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0f30fe325482c3f41c9232832a71a8afbba7b4e551c1fb3689a5e05e90d65813 +size 199058669 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_106_mp_rank_01_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_106_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4c97439c71acf3ec035c74996ce18869a0b490fb --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_106_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:458c5fcc921abf6d556fe91390f4d669c6197a7f8b154f7933a82f2e8eba7dc3 +size 199058669 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..72a0537fc1dbfae72d6bd6c0b169f768159ed510 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e1997cafc4d198ebebd20cb27de2a4b0373518c259381abe3acd9edaccfc3dd8 +size 199058797 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_107_mp_rank_01_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_107_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..59e3d163093ca30ab03351a269c146bef7ef28e1 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_107_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d5a2007efeb9b61a0d6dcd044cc84b0993bfa56bc217e2c7833215153b489665 +size 199058797 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..935c94291291a5431ed470221a543ef6fd2705f6 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8fbf3bf9506860c99e04b592fd27350821e62b859fe454b2708b6225148399d2 +size 199058733 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_108_mp_rank_01_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_108_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d0bc8a5b236fabcccc8ffcb988869cc704bb6694 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_108_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:44c65580528870ee56f0994d802247836f19f2fff3388aef1a7e7fed2dbfd171 +size 199058733 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f299d68898071e6a9fa37922b2d7acefa2e681eb --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:669b07a980ca2dc50dbca8eb73d533a0ccdd54ce2d314d438491d594c1f77e0d +size 199058733 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_109_mp_rank_01_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_109_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..44c540238c7d9eeb50ecff2f9e447898786f4f36 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_109_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7d3167b648e9efaf62d4bec4d1e5eb25bc5eb3a2d29fa9ea8ba57f43f8fcbd58 +size 199058733 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..af2e4c44d65f59592a5b6e3f4b6106907618afbb --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bf22e885fba86a57658843fcffcdbede6b004efd35876d133f80463e38de3e19 +size 199058658 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_10_mp_rank_01_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_10_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2916ec9ce79ef04c37be5f7c9fd0671937071e95 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_10_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6a7f29e972a42d1d47d78a7f1610f9f6b930fed0c3dd32eeff5ce1f45f82321b +size 199058658 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5dda415b782f2a5b1835428bd6589c5385a1c7bc --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7abf758cde76337d7e6ef87dd176046410727d5a9e63b8206395cd6eee576409 +size 199058733 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_110_mp_rank_01_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_110_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1400581386b44f79d1d9b090c4e81fc240bc7985 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_110_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bf0a406e55b06b4dc435c2b8dd36ce91bc9540e83d8b1afeffaed3b58a421fe9 +size 199058733 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..615e0d8451ead3ec183e91c6da40bc2976370a0b --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f77bdd5cc6fd249d98fa9bbc23327e63a772f4fc16a432721eeed0ec1d87594f +size 199058797 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_111_mp_rank_01_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_111_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fafabe68c4420d28000a32b05a56d18c8d63de12 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_111_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cbb9502b33fe90df7ebb9bb95131d2517246c60717e76599adbb721ed7e188b0 +size 199058797 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5cce4a5d228639182363f72368bd8d327d57ce4c --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:04fe247470777e5a4341463081a892472aef8fba3b87f50a2999607d86229d0f +size 199058605 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_112_mp_rank_01_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_112_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6405bf0e774c647a9e519374f8758ac85d977224 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_112_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:14b4f04a29b42e3dcd94f4e5c24c810642c4d0409f239610d3d420aff556d273 +size 199058605 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0250a67f75b4b62b15bcce818475fe13e8fd2e06 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3647ae5b9d1c334062f164ab5c23fee97f961c6876382628b1a6b760f2e8d3cb +size 199058669 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_113_mp_rank_01_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_113_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7638276cccb9e935f1b72afb3688d49aba8cee53 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_113_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:52fefe3cc9eb415f6dd43711755a51c0a423e7e2347b4c88db4c24759a804071 +size 199058669 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6de4589169c23cd7053ef8d360b8ae4231c44724 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4dfa05e27b08f4259825d6be78e0f1eba6cd5da874c1fb94f2844cbaf7bbfae1 +size 199058797 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_114_mp_rank_01_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_114_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dba2f149ab001a156bff59feb601488f96174d81 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_114_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:327f86abff384209a07f705e3abd62f2b4f7c4961927aeb30d358d99bd93f72c +size 199058797 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..99e38b27026117691c51c677653a487441442359 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e8f7e0b79eff33e9cfdb3e14d5d0f94afb78bec6c0e5624f3d265ca6abffbadf +size 199058733 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_115_mp_rank_01_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_115_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..57a8088afe47ba6924d3f7edea83e662fe5f8a9e --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_115_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0cb9a565e71f43d36cc563b8cc23373bc4ef095ad1d8ef7a33b41cc270c57ccc +size 199058733 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1d6dc321f31f38091376d51dcd107db118a0e2b5 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df16d5396328013f6b61bd7753430c3249a11ca5df6696bc19efaa610afb46fc +size 199058733 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_116_mp_rank_01_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_116_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..66c87b79874c21c0ee7cb1705116eb76bf70850e --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_116_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:77531cca7111a611438d906dbbde1bfcbf91a598780cb2c061a9b7552c4ce385 +size 199058733 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..10e75dd3c63714078c922efd867aafc12749cbe3 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:901e9fce812823436fa2455d03621285ad4eec122b865f89ef820921306cbc72 +size 199058733 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_117_mp_rank_01_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_117_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..643c4d8dfe54af9e1866daff92714084873f84dd --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_117_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c9e32dca828acf37754dfca000a496745667d7636afdf68fe1b0a3b01cbac22a +size 199058733 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fc85f683c53b37ec3ae908e0ad32d051c8f48c78 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a336bae1a4557757c2ca38b641db2ce665d56fa5104b6e0c36baa1fe5e7d70b1 +size 199058797 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_118_mp_rank_01_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_118_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ba1c69f26b2e4fab1d7686762752c8a24d1568bf --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_118_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:658ec5bd804bd3aa71a9eed6d6f46ff129bdd3847d47740c23c2dc716cf4ecb0 +size 199058797 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..41787586b7a68ba8a99fa351541a66255f46a8e3 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9346b9e032201e7f69b484610f8addf2510df2fca65cdff1bf68f0b4aabc06e2 +size 199058669 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_119_mp_rank_01_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_119_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fe9c723afd76f0979fae2055b217f1bff0e50db4 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_119_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5039eefd1756d61e9e5e631dfd443cdaa43587d56aac67d433143130da80d552 +size 199058669 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6bcd8182f6ebfa524cdbf50ef6626fdc1df0ed95 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1c76d520e776ed53bf969af491c31c1f96a1192595354bc9ed88f58d0dac3b63 +size 199058850 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_11_mp_rank_01_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_11_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d8466323f655e046ae6e7e1247dbebcf61f3fb71 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_11_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ef019837ea353893f9dd27711ca3310a5412fb8e7eb7f6066cbdd49468b3055b +size 199058850 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a0e58876ba27efb4bd12aef9ad69631f7b4f2f5a --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:62845d3d112fe9095f33d517ffe607675f73bfbeef2e0341906ed6a79007f791 +size 199058669 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_120_mp_rank_01_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_120_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4c33b7bd793d8e7bfc228ecbeee91843b0556b29 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_120_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2ecb07fa8d226ae65f7fdd1139e3af54ac0087a63daa031fad4ed4e3d77fd24b +size 199058669 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..91a63d7def6704bb0f0fee8931ec7b0ffaf7cf36 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f8c8498636fc83c49fdaddd0cf180d06c35efbab24dc70e3f3f684d86256894e +size 199058797 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_121_mp_rank_01_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_121_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b23b6011b9ace49192aa46a145c2756528463558 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_121_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5a7826eca30abfa677af7f1a25011bfe2681f1f38919df9d036548fee3ebbc36 +size 199058797 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d72548597e4258014344c345c81e98820d407b97 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c77e9cd692c62adb5edd70b3bbf003a630ed567c1fe2990145e612936aadd778 +size 199058733 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_122_mp_rank_01_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_122_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1b2ccb28d3bc0b429cc08dd826aa327f2fa3b5c9 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_122_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:91fd8b098300f51dc8b750c342dbfd195525d67f4f7d1362872bdd02fe67a1b5 +size 199058733 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0ce65adaf1cf945b56a44764f54b8b600a801e8c --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:de6c7919207889148ddd7c3673fbb81fe8dd5fec7fd70c4c6a5cd79c9c1db5c7 +size 199058733 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_123_mp_rank_01_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_123_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..126b1c4f92148e8ba55cb1d1604ea5a31881a1d6 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_123_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4a3317ff8efb2d5241a991882b5147f65ed5e9c206b81cf3e4d4c30fab31f3c2 +size 199058733 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e26e667409f50ba59d135c33b05397eb1fc92a96 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b32b2f04dd1b6f4c782a8fd0be92a4d316c49bdeb36092aa2d45e632032e9e2b +size 199058669 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_124_mp_rank_01_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_124_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..008fb1440f5c908827649a66dbe0662174dcd9c4 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_124_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b525b7dd72bede4be857e5ca8f31bbc4f2308bab8073593ee67ca5c1c276f986 +size 199058669 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ec1a98cde4f4cc17f8b195e265904de12cb4d954 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ac5907911c62211b4dc74caf6344accac8c2abbb6a9b431f5712d0408cf6fb81 +size 199058925 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_125_mp_rank_01_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_125_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6c29ce11f88aa59d053f3b5681b97f1e93a952d0 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_125_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d3536cdde3157627b264817a961f197fa7941b68530dd02ed215fbf0609343fb +size 199058925 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..23d9458d34cf3b0d5d1da9dc93f06d02c027ac94 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f5816e5d684edce98d91420fa98b3283b4a98ff34c4a12b3ef6a64340153b1f1 +size 199058605 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_126_mp_rank_01_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_126_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5534187ea11633e17ee80aa5bd4d9531a72981a1 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_126_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:951260f1007556f169a57ed6b704dda69e41268cb9c8f0fdb9320b3739ca55e7 +size 199058605 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..da067a00027daa29c784e8a77234fe68d13777bb --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d0730ae212ca766dbd9aa3567e7643b22c2bf193e401cef1d11815e177534d16 +size 199058605 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_127_mp_rank_01_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_127_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fc8bf324ddde9f1d7e6747c90e4122e75d9d6c85 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_127_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7fb4ebbfa772fc73f61e68ce9faa1d31a11f18c6adc1ee2cd8b6b13b1d1691e2 +size 199058605 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d1b055025b4728e61fc873ac5453bb9af04a7737 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:82bef02865f37a7dd6af31365253b632160bc5dfc5fd137acb777d4be25d7e9a +size 199058722 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_12_mp_rank_01_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_12_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d3142cead2c303db76ec065f77781226a0883ab1 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_12_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0c50ee8f7cd2466f45c1cf6ac7669e5bd51fbc297c1b4db98a036b92d7fd8753 +size 199058722 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..61611b60b8b9adf7d96fc07531b9112d54057cdf --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ff147cd34cff01d4fc661754e88c17ce4b40f4051cc3f4c32056e3bf68f7b811 +size 199058658 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_13_mp_rank_01_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_13_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..93f1bd2e911ce99282a02c86ad287740d5ad0b88 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_13_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3338c38c45a39b2209c63eb5303dd7f28f3cdbcc8e93a912ae43f020bd6b7a10 +size 199058658 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5826927b00d009a2bacafb9897d9ec30d1c99a3e --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3ce69e188780b96300f2e30da5b36afba6e4b428123d13b4954e66bfc42a3420 +size 199058722 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_14_mp_rank_01_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_14_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4c0c096712a911b049a8c14adccb928fa503585e --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_14_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:50287a7a370b494a15935d6bd96aedd92eb6fb3e5520a8f26fa8c3ccbb329b9f +size 199058722 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6427cef259f17b5951c9e4963b489518cd475513 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ebb38a6d5d3a7b453953a99f01607bfd01ba2a2e522afd1fa84d996899d8e84f +size 199058658 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_15_mp_rank_01_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_15_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d6fb8fb367a87b80df50cdbb397c69938f9a7c0d --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_15_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bf64a12e38f729d1537b46af606e8814a221b9cb2f534616c5794c52f3c1d8ac +size 199058658 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..caac40af47a61ee23497162235f9421f163b2cb0 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:180bf562533f32eecef4ad3140a6cee2b557883106cf063f8539d0ca97da25bf +size 199058786 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_16_mp_rank_01_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_16_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a8df9b41218cff57c4aaa767915174107b3440fc --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_16_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a71a1f362b8c0c7f97fafb71d53568c2a66517dbbfdc09468fcb31d27c0f5a40 +size 199058786 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..773f72f0dfb40ec4305e3abdf189deb74dd26fa7 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b05d07c43e3c4938f01aff485230be241e55c4df45cebfe09ffe8c484306a092 +size 199058658 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_17_mp_rank_01_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_17_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5c12d8f017657e32171b50120aad62b71a40aa29 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_17_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5b139efd6049a164132304b94f31f79085accee3af66113c957f6ed31c560aef +size 199058658 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1fe80bd0f297aebe8a4b2a5a82e5f05ad1d91070 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4dd7485e894cf79ec0e4b456318631cf228c0adc92516820ec38146e1cdd30c5 +size 199058978 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_18_mp_rank_01_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_18_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..70c750a403fcb0d8d541295ce4c7195cbfd69588 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_18_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cda362a9f6cf32f1020f232607e53618043a45b231f4a581a81fbdd065c671bc +size 199058978 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1819973735904660a6596559bf2f5ba2e44556ad --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b4b2340c6f5a9a6f112630e35af59cee3220443b46e0a59e576a6d8850be6bfc +size 199058658 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_19_mp_rank_01_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_19_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..34ae04a5550adcb9d76ea2b63e4dc04a36c7f061 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_19_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0df4206991de9691f0b41bef6dd87b4d4a5d6eb74fffa4961083e90292bd5923 +size 199058658 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9c90f63e36c4b891305fbdefe896519c5fff6f61 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a7058df15af77d498c00cf405c6894f20b976e4b3fbbd0f890cec897e4e03665 +size 199058647 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_1_mp_rank_01_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_1_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..46d0456b3f1c65d355359c9f782668352bd0dbe8 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_1_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee2e14a87090856470df44c189b033aec18b399b12e7a9791e33c1f3f9b0b268 +size 199058647 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..18bb2ba386aa4d919e9f69e873f933bf6d893b23 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:387c29626f176ba573144673836a8df2293b9696baf7cd3e34e76eb081e79254 +size 199058658 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_20_mp_rank_01_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_20_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..786cf551c6d2cd6653910dd3f9780fbe7c5943de --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_20_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b08fcc3a99073ba335705cc97acd661f0624350d029cad7ee9c499957f43a524 +size 199058658 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1845d1ab0c4f583f9ca76e9fbf1df3c34d2ad104 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7433e883e2337a0e2afd6ad8f92666181a627ac9f1c0608253c5eb323a0a6707 +size 199058722 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_21_mp_rank_01_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_21_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bf3a5acc0c3a9d90ee1a009c4943b648ed0b5732 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_21_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dbab89997629abfffc93e5342314fbd0b36e4ac19e16e80697bdd37a6deeeaac +size 199058722 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f28fe0de515226c3d6b00cf8a3b4c1ede830b400 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:50eafcec71fed58e2094c345d9d4aa9cc61fbe42ca0a9464f2179ebd503ccc5a +size 199058658 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_22_mp_rank_01_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_22_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c801f843d64b58945aae12dd214a19d0c678ccdd --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_22_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f27a369f58e8e8d7922a59285ab83d4a3e32e518a843309957557cd5af3236a +size 199058658 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d985eeb7effd3e1dc9f391fe9bb07a71ea47549c --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e2876c56ae0723eb8cf63ce9000e80876b4b4cce5942c5dca1d3e6166cd20a61 +size 199058786 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_23_mp_rank_01_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_23_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6230a3596f632b7c2d1e27a9f065a795cad2c90e --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_23_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b3754bb982b3180751616d8b2b7a597a4c00c61e7c1711915a14e165cb0abbaf +size 199058786 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..58bf8c41c382552d54b3db2ff5028b96f4723b04 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ebc4eac02923f7775eee69f1e0a2016495c604ab774841266f30d0a18292790e +size 199058722 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_24_mp_rank_01_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_24_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3f301ef8a2fa6135ccee3e8115002b78a61b0d2d --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_24_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:17604e42a28587a3db38c1df2d7ec7a392d2520f933da97bf1a5c475e7f2218d +size 199058722 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bfc26b99681e2994da2c6c0619f6450d985a8ca9 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f5751faff78ecbb07c06f1b1a4431bed751277ad079f8cd501a08a57bfaf3a69 +size 199058850 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_25_mp_rank_01_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_25_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b1ebfcb183d349bd7d7e776f5e706cd8649f37b0 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_25_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:610bc18a9fe343379b35c1af5191a404f720e62cc1b86da0066e261c4e75acdb +size 199058850 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..daaf4d89aae40e7481742bb9b30b3fc9a47fc3ba --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e1ba952abdcd860464443227a7e80404845ebb46a0c79f4e65bd976b9e3fb1e7 +size 199058722 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_26_mp_rank_01_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_26_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..09bce5370b9538e12c10188276f5994c9c2ebb2c --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_26_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a64771fa064c5b49cef075d21e9bee7ab446ae218262a774af79faf1be022ba +size 199058722 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..830ac91c93b46720fc8375a5dfc61b228c25b7ff --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f2f1f3d0c221698bd50604ba06c7af0c438a4cc69c3c0f0466bab15f3edecd66 +size 199058722 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_27_mp_rank_01_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_27_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4dc74a7e596ef705ae5f440c34ad767aa51b248c --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_27_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c2b206dd682d2eab7222b61dd4fc4a3572b3737cfe0f765b29f82a480a791999 +size 199058722 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3653ada72df528c8b0d78f4b7e78c3e56a9320b8 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8f981056aac00e461e111f6ca255eb7b96bef0f011e8d2e5cf6a28a5d1fe1fa0 +size 199058594 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_28_mp_rank_01_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_28_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ceefbf797258ebd0792e0e80b641eb6ecc7e6071 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_28_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6da1682f70a2071a59fe290f3f4980c124b0404b08137ddaed050021b5ee7861 +size 199058594 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7fe771ffcbbf2d4d696b9165dfc67cb0dd2f4a5d --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4373f3abe600a7daf3199a363c0bcb22ee1e4b50b4d6214e2ec0967ec6d498c6 +size 199058786 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_29_mp_rank_01_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_29_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bb0dbc839765d02edc1916d093728863b3ac7a0b --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_29_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d6c1e95b5636128f2aca1b2ac011b0a0d459050aaea103743f5aff51aede0666 +size 199058786 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..15e4275085e471eec64e68736342411a0383b780 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f6da7ec672ae61b546f938668f6de4e29982ca633293416fe8bbcf70a8f22666 +size 199058711 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_2_mp_rank_01_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_2_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..70b0c08a4dbfad8a02b70be36806865a580dc717 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_2_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c090b07af4cf3f04dc5187a7b778584658e6dd68a6fdec0e08493ea5cab5ac3e +size 199058711 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..72a6a9776c6de7976daefba00f3ae44e27411dd0 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:de572b649ba26134615a8b7bc4389ebba3e277c7f6ab944edf41743f0d6906a7 +size 199058722 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_30_mp_rank_01_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_30_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d56756113d348724e2e2a19fbb61dceb2680f473 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_30_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6a1b997481b296b2750816cef46158413aba5833bafe3680b6b3ddaee6c486b4 +size 199058722 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ca805ee0615de0bb1cb5638e89608f6f13b6a411 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e3b0e904769ee1d6e77b37111edb5625e1e864331bd3ceee2a6579f604ed28a +size 199058722 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_31_mp_rank_01_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_31_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..36dcd75a0bb2c3250a378ffeec0b9a28a19f4b63 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_31_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bf320e662731f3d13a0d2e295ec158e27bbf2287347b9e5c9881a77c92d563fa +size 199058722 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e88bfc87ba982cb615a89b4716e15710be3e8fbf --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6575d21782e581cfb0d3a8cf2d6d57b26b1367cabdb536f6160f97717ea360fb +size 199058722 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_32_mp_rank_01_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_32_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2b01644e4d020b4e483155215d806e5b7c6a687f --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_32_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9f33c7c875595783b457be58a1aa58d75613208c36d794706364f22acdefb2f0 +size 199058722 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c5bc1c6095d5284a08717d7769a92349f58a1254 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:27de83ab5a4e372ffe7d7ecf93a0966bcde93b6a5176e79147990b6bc22f8bbc +size 199058722 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_33_mp_rank_01_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_33_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..498de89423782b3669fca1dc0831fcd3936a09e9 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_33_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6ebc60179e0f8470ed11ab3971580f274c64d277d87a5aaa4a1d7b72b01b8b67 +size 199058722 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..87955da48e3ddfdbd35b486940084c7c519a526b --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5b0cad675b26428251474d9239056d355f67d85f3cf69f67c87cce7bbea327f8 +size 199058722 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_34_mp_rank_01_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_34_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d2c324e2829608f77062e5f5faf08ff17d0cfae5 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_34_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:624d464c6941a4f0ff0f11f1ee92265c08a85d643bf752b726684b9e44356243 +size 199058722 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2dbeb20229b56e200a18320f54af8fc2b710d6ba --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e83fd7a91e6e50fd9f2b24a043f53825b6e7b9f6270b3428fcc7b1a39f06544 +size 199058594 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_35_mp_rank_01_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_35_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..251d10b547232203ddfe1e83e969c4592926f183 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_35_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d419bac52b47da24ddf2d89036b3e742c5707b813841f9a1af9bde84bba2779a +size 199058594 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4f92be1267dea7e9ae683e5a33fe1acd7e00c65c --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e96e74afa5ec9d779f89abc0c88d7c1e3382373d45cda794921d76a9f80c2c6d +size 199058722 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_36_mp_rank_01_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_36_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b59fdb33585710325fa62f652df84f44c3de3039 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_36_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f65758a9f28b3a485fb7842ca8440087451f3861dfae99d3b030d8ab3d5774fa +size 199058722 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..44a656d70b4e38fa4ff787970f5cb6182b072e47 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7222edce41dc89a5f01daf85da50fd53f686a9ab99268c9654ee19f5b1af6b83 +size 199058786 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_37_mp_rank_01_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_37_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..874c7f9f55bf4986dc755aabee12fe5dd1658626 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_37_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:829a671ec173c6b2479c10cac68276b1c6884f35cf05baf18441b75062b89a09 +size 199058786 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..835c052cf97e5f59276f34cb7f0cee62bd70bd87 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6ae198842712fb7dd747cabf2a38aaf152a0350757597e1f3e7f97e127b78470 +size 199058850 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_38_mp_rank_01_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_38_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e0fb42191440ab71cae70191ea11e1d6d2a2a1ae --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_38_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e2abd643bc2217b1df0bb7dc3fd6e5afe6998d929e3ef16ee7a1f69b6394f72b +size 199058850 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..144cb615d9e740961e7cd3c404835cd19cecc894 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e7a47865d5c22d77091b1ece8b541da94f6679d683ab486989f8c7ae2536ca4 +size 199058658 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_39_mp_rank_01_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_39_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1ef6c4542fd99e8375a6cfcb37229be2c7a3a7e7 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_39_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1231de0a37a62eca705c59dd2e7e6510285a67cbaa7247922ad743a22424c8f8 +size 199058658 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ad60e63793e6dcd8a06916207d2e0100f4a8af1c --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:98c72b3cd374a9201a5a4b531aa64e53a832c4cbc93f0f586431ae117c2b334c +size 199058647 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_3_mp_rank_01_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_3_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bbe50351519db183093be2f7197cc0aab1f9dc80 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_3_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:15ccd6ccc4b0db79f88f963a24bedb2da20bbea7ad7f08e54dea0681016c4763 +size 199058647 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..198b77c0e069263f61e6e3af8f4cfe9f3e1f1c0e --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cb3f3b4ade07ae4a425a48c05348a6463ec359ab3e92c1480236d0314c09c4de +size 199058722 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_40_mp_rank_01_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_40_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d9587fa206493e24fff1d1b3d2926211d2ce4ba2 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_40_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:08861a73f29a8dbc77e342bbeaca4914af388c207cb7d5488996d02d5ed87ead +size 199058722 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0168d366aa05b87b662e634b97ac528a15040a3e --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0b86c8efdc41b7e843f9a5752fe628c39cae4c920f2e236ef22a3e67ca1581cb +size 199058658 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_41_mp_rank_01_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_41_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dacdf694123545d3e45b6312e05b58d653d8b49f --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_41_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2ea84b8e7731cc8e72d2a85308774366859a2e0bf2f0cc7a9eb6a08f79e5a050 +size 199058658 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..62df1d5578da729670dffa67ac3a8eaf17f347e1 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:920529289b9f4ec35b325236c6b55b0c685529b1d2d3dc99588a76ff4092636f +size 199058658 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_42_mp_rank_01_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_42_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..109c65657a0317d233a540ad18f013b9f888e88e --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_42_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3d9226796bf3198bcfec4277f56f23fa67355ea0b84da66ecfef38cc41c88a03 +size 199058658 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..644bc66e4b626593e7585b692c4ca4b7fc8954a7 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ab4b9ba0eafe7f08297b854c7667028a1fccd1c92f98b90d9d87a189e80556ba +size 199058722 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_43_mp_rank_01_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_43_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a1656eab21548fb7e127dfdf4e4f6ddb1a15c458 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_43_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:47fbc3d8422dc0e60fc9b871c3753e1343c31aa12209d51e9e1311f9007a19e6 +size 199058722 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..90fb310c7c85d07206e1bf79e1e1d61367c60f65 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b9b541bc49a5f489ebff5c51d593d176bee4fd1e05430ad58d675ae1d431663 +size 199058850 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_44_mp_rank_01_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_44_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e80e922d9890c7e2c9277ed29698ac9788b8ef9d --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_44_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dd3f18254d509d3160b428ed44a30e29c315508869c14faeef9968ac26a0c1bf +size 199058850 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f34326d7b7d40d9006a2e91b011b66ece86dc086 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3ae482f3cf2c9a899a9abf89500701c8ca211066202dd4ece6fd356667a46409 +size 199058722 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_45_mp_rank_01_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_45_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d514d43aa716ef03b89828d9fa1a0f5b4ed68a9c --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_45_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c03bf13c31e60dd1333a69ef5db6c150af565d88d0f0f99545c28a52b0206aa +size 199058722 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bded76f6d02a606d57fd4ebcad6344d6d0f120e7 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9e683c8cc4bd71c122141408cfd9cf47a31bf5a985d1a8362df33bcdf93d6f41 +size 199058658 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_46_mp_rank_01_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_46_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..388b4fb0952237a50d84b7a53dbcd252bb457a54 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_46_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d6dac517b9d37fbf7bf3755dd03139927d3b8a092e423336a1c7f7be689b454d +size 199058658 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1d7f1debe933d6399ce53128ee6d971edf3ae9d3 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:18fb898c7ff174fb134f665493ddf75b8848d57f1bf05f7b5628613ac8071d80 +size 199058722 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_47_mp_rank_01_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_47_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5455ee28d3ae0de89a8603c6e97e33c70c1ace33 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_47_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2c445cd971e6964bdcb8767321ccb47d541cf9d10f35bfad91d5de4e7a657ba4 +size 199058722 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0f7b5139dfd0c9faaec1bf72dc044dc573dc29dc --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6ce246c06f11641662a1d0340c93ae07751305ece3b26901323ab5fdcd2af55e +size 199058658 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_48_mp_rank_01_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_48_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c6abde61ea315c4a821f10f19e1034496b1bf3d3 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_48_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:494c40c727f6be0fec00bb22baa7d5c9efeaf2133b73a3816aa3e0712d9d0e5c +size 199058658 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7e283666d792e27849a0de0c29b0073a3d65fb49 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bced13d93607f0db62b64b7476ebdf7868c9ac1175d8a80984d641fcc54be5fb +size 199058658 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_49_mp_rank_01_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_49_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fd8b9ac6b094511e559bbab636cb937a789ff5b1 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_49_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b354bc215b754ace911cc726fe7b83398881a210b2bd71454e5303550f13c1a +size 199058658 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1accaefb671fd203f567c34c70b16d3f9d2bd59a --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:92ca759b72dc30cbc6a0e0a6da75ecd4b5bd9e9313bc0753f076cc7ca29365d6 +size 199058775 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_4_mp_rank_01_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_4_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..056a99bbcd6eab29a8eabffdc5ede13a3c3b5781 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_4_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:466b14645042217bb223e983aaa69b99ae35f3ca0ac3534b88fa13a729236156 +size 199058775 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bd32b5835451b7c8ea68d322554c74f4f79da1d3 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e36656ad7b0cf0108f839b21b2bbfea2848c49b15484b75e7dffc147b670bc2 +size 199058722 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_50_mp_rank_01_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_50_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2b547457596c8d428b617195cc085fe3bc44bbcf --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_50_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7f6b9d974f17af5c19b1400ce2e0b165358c93ed41686e77e2b3f0205385ac04 +size 199058722 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..05571464995dec3273f0202d8819b5ec64d6924b --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e6589ee3093a12d4746a4228454cde99ee31534b05cacaf228985aae23c1db6 +size 199058850 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_51_mp_rank_01_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_51_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4e5dd90fc25cb55cd1709468057f6867f98873e7 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_51_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:191ca7d077b8aa3c6d8a476873b4e2ba7699802d743ace80ab8855e2f527d12c +size 199058850 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6d358b6725144abe96c484c24e774ff65d6e5e70 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6bb0d73e774d2bfef8cfb601ed62aeb7505e5e70342f80473afe3b46bea75211 +size 199058722 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_52_mp_rank_01_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_52_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..44ffc57dc25e639d18615a3269b2d1a309336ccc --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_52_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba3d6bba6bef2e1ce3160b9a16686f908609e5369bb54c6c86f8f3eb7816a937 +size 199058722 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cfa298e5c05aff7f62d749d951c55341f5294397 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:58d1c7bf46eab0fc2b80ef49b446587ed88a318c24dd0e26f7e094641ee65862 +size 199058722 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_53_mp_rank_01_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_53_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1aef65ca259d6075e77996da56d6e708d9da672a --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_53_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:96bdd2499557810e6b74893ec6c149a5c60834637b8515c9ef122d1c92f9ee8a +size 199058722 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ef44da73a8a539663e1b118b1b99fc47949cecdd --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d56ac5d35046289090c16c74f1d8c3a74441e05e84e051652f09f52fea7b0cfb +size 199058722 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_54_mp_rank_01_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_54_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0159b62f2ad3b1d8cbe42123f347a209155a7b97 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_54_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1d5462f40ca4d7e04f5d0eaa1a2a77169be78c1ce747f948c5039c38fd8b995c +size 199058722 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c8a9dcdac38b7982d44e2757cba9debe3a6594cd --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a3659deac6ea580c703d07df48e58c8777383c76f7004f710b1d98802fb95bf2 +size 199058658 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_55_mp_rank_01_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_55_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..83b753099822ebbcd5ed02715d483029c42e73e5 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_55_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d12cc9a5d41d7e117a496072c58a83cee4ae9ef4b99dab7de1de1dbb8cc269c7 +size 199058658 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6c0a7db1ea556d35705bafe9a919e26b97fa9fd0 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:31d886c0f8d5fbdbd1d1dbdc8b1cc955f21b8cfc584dbe4e63cc24a650824498 +size 199058722 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_56_mp_rank_01_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_56_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..78c6be056ba88a91fac6b3e41cf7e5b51034b3c8 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_56_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:11e399e3e70b2ddd304ecf12c59c3136d04dafab4a8eab6812dd0f1044d60a74 +size 199058722 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5add359ef7daed24e82717fde5f198921992ca91 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8d559d2b6ce8d1147fd948d32ed8096f750a9defdd90cc550fc7f9271d0e242e +size 199058658 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_57_mp_rank_01_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_57_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8ab614d7e76fb6b320bcc4877f4823b245b2fa6a --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_57_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:479d7a4fa77213f72c3d36c5c62595722c57f1fae64a307ea9ac47c324308945 +size 199058658 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5f03fe8e0814c74b87565f02c8bf1f527c923f00 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cbbf8956327f6d0909ea755a4db2335b1628641e3d3d8ec1b50351a8a344ed2c +size 199058914 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_58_mp_rank_01_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_58_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..519c74e06ff345a62b407559d02b7a5af3695f31 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_58_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:99e3be59d4c05f59d7c118946be3ffc1486298fb516798225cf08db21f04fe8f +size 199058914 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3b65c4bd95a366049bb7bdd4c3d893d74da2c00c --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b294997c09f37ed0dba3afbc060bb608c98602fa1fc8fbea7045b9e6f4c7cf0b +size 199058658 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_59_mp_rank_01_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_59_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d0b10af44c82e82f0917c21bfb6e95d964942f22 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_59_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3890c0d8d55ee9d53a39de8d1f6a8254a20cb1483c23d25ebd36663b1694d2a1 +size 199058658 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2c787a4b5be6b31f133153afe1a53a737d69deba --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1f57db3d7e0154168da6f4b629a2300ea96f243f8f911efbb4ec19b0b3ab638a +size 199058711 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_5_mp_rank_01_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_5_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c3c95dabcded2cb7b5dc2c644deef5f598a355ff --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_5_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fab78e8fa1c069c53f88865347664efa030ecbfda19c70cbd55e046c128606a3 +size 199058711 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..18c2c36c943219c885a1a0914fb4fdf91461eaea --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ccf772962b9b00bf6ad2f83e839667ff395cf4d6fee8f9b1c8eca3ff537295ff +size 199058722 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_60_mp_rank_01_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_60_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..74b1cd4d48ca665ff2a9ec4bd6b611cfe61092ee --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_60_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ab20be7036406defc4169dca4043aed88e10fa75149cedb9281b7ba08834eb6f +size 199058722 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..65eb7351f90e789f8e319f6b6d6e516eac631949 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9885d365ec951dc4f7b8b057464e1df8cf738a997911a8969655b7a977e6afe1 +size 199058722 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_61_mp_rank_01_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_61_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c070729e1bdfb873718335540a31500c319fbc3a --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_61_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:64168edfdf1a84d7343f60456c9634bb215c1e822ec2373cf70dd7549d72f10b +size 199058722 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bb852693b6ef03f3181ad7f97a4780c6765965ed --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:901bf35a3a1125fc97ca63eca974924c43cf0eac1bb05d1462731e5da3c53e77 +size 199058722 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_62_mp_rank_01_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_62_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7f843492f45aa8e87768c24f2d849c36e546856f --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_62_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0781de44e304a1de06dbded7d6ef82ff563a8e2f5af7f95db11a7b3def74807e +size 199058722 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..da1fc30e560b464a986dedf10f86f8b8c460577f --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:17786a6fa03cffb0cd522387b6cb175bea8e4e39517eb30936f50416ee1cc3c5 +size 199058658 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_63_mp_rank_01_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_63_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6925f8bfe2d22b5105c8fdcd4bac48ff7fb59e2f --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_63_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c9ac175fdd27ffc1d1dc6424644e62546fc865ae1f6d84b636c13a197335a74 +size 199058658 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..80d23252c6db83d317741ab05f03ee17bf781495 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:716fba97dd14e5909370358c3dadfe358e70d92c599f6c8d49db1032cdcb6a7a +size 199058658 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_64_mp_rank_01_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_64_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0d8bb42fe770c606af99d334680ee3d2f63d8376 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_64_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:15fdb80fae09a3e6bafc422e14b72d0159d31210f5832bbef4cfc00f0861e5e2 +size 199058658 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1e0243df4339eb683ac4e23d7b35f6a6acf7d589 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2262280efb48103d156add3f95c9dc64a87de48f724ab4271db82fd96517486c +size 199058850 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_65_mp_rank_01_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_65_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4fae11969ad4fbac22c743f24622721d23cda5a7 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_65_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:63c5333cac8cf01e4a43537a74c002eb773fb87f2a7de13f7f8dd72fa6689c39 +size 199058850 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4cfd6f73e0d5d629fb524e71e90786a670cd24f4 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4fe67dd7e8ca8f3a7fc47c7d04c4090ca2781f8b12f2a0f8e6a3f751409887dc +size 199058722 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_66_mp_rank_01_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_66_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6f75ca75ad947a771fcb79669f6b152a1e7986b0 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_66_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3722e3e46140d581a6d613ddbb56959da6494673a889c0e557168b9c62329b0c +size 199058722 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c5a83ce23cbff80e203686ea91c26add71717e0d --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2aa99e30096a24e4b7f1f3584d003f17015845ac40ab53adc0e6493d79bf14a1 +size 199058786 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_67_mp_rank_01_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_67_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..813cbaa146e15b524aee2b198c97292df6dda509 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_67_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0e54e87eae57896ad42964c18c737e02075dd728263eebba6a7fac29c01d5536 +size 199058786 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..63717be7d888dbbe62317866f15d46027c717ddc --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9e44e01aab96c6b9621dc36cabbaf8c9d5d043ccc9b632437de1fbce0c9564a2 +size 199058658 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_68_mp_rank_01_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_68_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f16696bf7a7ee686051caf2d62582debcd584fa2 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_68_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:87be81bf48683f02757138d706e7227a71af0ca98fd1085eb6fa611990d3f497 +size 199058658 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1815af6f9b5a09e6893efc98d84b7d9e761a35dc --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1f43c87701c8886be535d80ab7ca2bfad54c5def3300d5087c8717d78df5972f +size 199058722 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_69_mp_rank_01_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_69_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..75e532205b91bd51bda5908af65d217aee4b15ab --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_69_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0694773c929009578bcdae5d9aa9ed6a50ad66939bc7baa511d25a5ae8e4ac4c +size 199058722 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7763c99631421554ba7a944e76214bdbb10ff10e --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6edd3c84ae0b581fc3a898e96e94914120aa3038e453e6a4b2ff4b4ae395a65f +size 199058647 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_6_mp_rank_01_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_6_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..93a8481a4dad0625f9d33958b78bb756b50c9bf5 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_6_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cc48867cb7c734749b96e91b7fab45805c3dfa8f875b10688eb8598732482e30 +size 199058647 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..145c9c4e67bad0f9529b838d9d8aec20cb04c048 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3de2dabda1a71c32f77af6ae9d5e63aeddda1f55bd0d0852f32963a87304aac4 +size 199058658 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_70_mp_rank_01_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_70_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1a0b465139b866bcc131e28c89950fbdd5586f3c --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_70_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c0ca8cea98ee5e7f33de4d0630f86773eae1d94b047e67b9029ff1dfbb4d956d +size 199058658 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c5bfbf85e0171c113bf1157a0af2c2e4e7607c17 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:07b454e3fc76b77e8d20d2f8fad438470a78f072d19576d074514c84fe00d0b5 +size 199058722 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_71_mp_rank_01_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_71_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cca1e6120316abc94b09170579211c531491d80a --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_71_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3d652e0ae0543e14322491a393dbd0ac469bd14c7e2682fc0665f40add29998e +size 199058722 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d137d44ec816ab36b0c187a8f36496a3808ff16d --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7f81b2179acbf54fcd1f015b89c8fe104c2aa35e93e388d7e64a3b89dfc3973b +size 199058786 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_72_mp_rank_01_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_72_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8cfa0f3f52faf3541909ed735bf6bf00af964925 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_72_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:85931e1723d6c430f79d20a8f9cea7562d675e330fe407580d00c2450b81a856 +size 199058786 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..122d58272b02b6aa946da6134b03ba171f7c12e1 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:faf75f087de93107ed12d11d2c15695cba3df66a108cc461a434d68ccbea6695 +size 199058722 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_73_mp_rank_01_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_73_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f85179367e3e081b1525d5d507f80b300a03ad0b --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_73_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2becea7d5730fcbe9afe8b5b39a17c3a088c02cc2085c462d263cdc749609284 +size 199058722 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5e99f702e8ca81b824fb81ed6a0ff43da608d2f2 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d84126cbe5f3dfb1fff1c09ab6705ad454e6cca9c653542242993d4cc0b46f07 +size 199058786 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_74_mp_rank_01_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_74_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7d50f61bb9ed40fed6a54abe425a4d4fc1f1e56f --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_74_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:04285cc781fcc13fc306a5642672eae32d18122e54e53e000b5fc0648c5be93d +size 199058786 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a6e6dd52ea7b08cc6cf311d22fd99effcc2befca --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9da851ba50756ff8eb3bb95339a152e18c3fc4e7211ee6d2d97258797bee39a7 +size 199058658 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_75_mp_rank_01_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_75_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..79073618f49585bb2788f4efab28b1dc0fcf8ad8 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_75_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5b795302b78802811c766aabf2b7d161def048c775b3f28318218591d63c83b9 +size 199058658 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d32701bb44a3b2f796297c65a64d0e547991ba5b --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6e0a31556c202fcd546b54bdf63c52d2afb54f9d280c563e3330e4d9e6ccaf31 +size 199058786 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_76_mp_rank_01_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_76_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ce1923f5d75744e4e4dd8bf1434ee466b8da58b3 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_76_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bb8a3dce106e36b0b0cdfc35f12273fbaa69b28825677bb2db607f0f22087cad +size 199058786 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..35e998a1a81fcd2040503d5a23f6f19af6fd5bb2 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c3f73700bcbf743b3d3dcc8e0fc6c4d2c18627fce51de8ec73b090463a3442b9 +size 199058658 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_77_mp_rank_01_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_77_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..912bb987bdf1662dbad83069c6160bd92b7cad2c --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_77_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e065dff6ca0c9e13fc51d2e0e83f81a073cb276d2006a29875b04f6db0f543a7 +size 199058658 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..89174f445771b10fa3336cf8413e3766d14cab5c --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d7e8e7edeeb90390a554a66a8d8e1c2430f8d8e5d8fba6970d08866f35443e48 +size 199058786 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_78_mp_rank_01_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_78_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f81b709db6f621a62838be34f1eaf1063eae118b --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_78_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca7ae18c108ea1dc0018d276648b8027fb3a3f6a94c0d9f86fe9020d7c965444 +size 199058786 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..997e0dbad30cb4fa7c571cc7ab35c02895098f59 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:530ba39483765c9fcfd433c018b7655cb976748ad0d613c0c25e37ce72119046 +size 199058786 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_79_mp_rank_01_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_79_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b6b7c8ab48be7bb4ebea59dc8e76a74808d15d6e --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_79_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:910d599a5499c8fcafa23460a1f8cfebcb73b81d16e1ebf195cd16d442b074ae +size 199058786 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..684e5e8cbcb4319c73232380572e7127de1cf342 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7111e19f65c543904e952dc118f2bf0645dc0a7ec7b23729c48c159b8955cab7 +size 199058647 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_7_mp_rank_01_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_7_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..72a720d7ffe68abfad40a30c15166a3c9c3ec4a5 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_7_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6ed90afde595a0c0334b7690127bd10fb1cedd6dd605cd7ce234cd72042ed306 +size 199058647 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6cd3bee1d92b64be145d3782d2d5d317a8e71e72 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:495eca1a6ae2936ef05d89f53fd3309a639a0eb3cffeab328cbbe7c557050d85 +size 199058722 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_80_mp_rank_01_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_80_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f9f8bfd1796df5acb8354f0eaf335085c70c1660 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_80_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e0b0123798df40548b28b4facb16244cb318d3c58e321bbfa9b1f0f5f956c513 +size 199058722 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b75a9e6fb1b20bd0267b436dc36562a5529f7e1f --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:70973667d6f8c93c8a580ffa28024f0eeb36732a1e401ab2a7a9a90ef7ebc1e7 +size 199058722 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_81_mp_rank_01_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_81_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cf5825080b71b805e8066228cf54a57d2dc00a54 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_81_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b739b2332546e0ed8ae893be8e23ab5953d3a4a63a72b87bf6d68ac305d03499 +size 199058722 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..61bad8a35b7d4278177b2e7e94322b78a64a5b55 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:246d428b731f2be8946ccc60a4f2d903bb1a805fedeee80a0d388c2d75a4f4ad +size 199058658 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_82_mp_rank_01_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_82_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..119cbdd75ac476f54db3e561aa8b663d1bbffa76 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_82_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aef1d28a25c28d6002ce0207462e3f2a79d8556dfb4c2fed67dbb5efdba11946 +size 199058658 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1c665c3339fad49bf50ef7ad3f8d67f79421e47d --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:857df0b3d3ff50e1a314dadde73dcd7bac7987cf1c84416837f010ed0782e4ae +size 199058786 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_83_mp_rank_01_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_83_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5d7155a82e30a358d5d96ecb98a7d052e5aa0122 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_83_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:510f24f5b39f2b4bcfc850403bd09b90a1f61c24585e850454ed8c603f156247 +size 199058786 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4bea4937f507200df4bcb2dfdc21ae55f5fb6049 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3383063f4386ab9ed3b6907b211f226b07423a21a1370b097a52d29537c5170a +size 199058658 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_84_mp_rank_01_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_84_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ce992b6d6ddc22908ab7ee84f8fb4e4597d59bab --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_84_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:64c2204781c758ecdaa75aaf490deecb69a9a061891c2bfd475a0310f28a71ce +size 199058658 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..06620aa08e1adffadd330e8e31adead950f548d9 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e77b0ca081eb0ed9ac580ec4248690c82e0a11d22663651468757a111eec3672 +size 199058786 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_85_mp_rank_01_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_85_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cedd5be685a2847a467b3af783f3e1f944a25929 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_85_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5fe122ff6b53f15c29dc6ad2966b993a0675e9a337714d08602ecd81cadd479e +size 199058786 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..85a870679a054e5bd496984f1139adc95ed11a31 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:836b50fb28b068a21f13b1e82a52b9a13ff2c519cf58cae0ca869ba3a0d072a8 +size 199058786 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_86_mp_rank_01_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_86_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b1b44589f4e3f6ed23156ed32b0c80a6fd5ef6cf --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_86_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b0123e442146214a727c8afd638f59cd8b8cc8447e8c3d780a4fddcb9fc46dce +size 199058786 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2249c76ccf452454c47c5ecdf98817b73fd2cb5e --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:423cd078f7642ac5f4988b3822a900bea322db8f8b6eddd5b0ad3d6755060c79 +size 199058722 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_87_mp_rank_01_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_87_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3f72f9dddcb7ad8a94086689058e52108041e14f --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_87_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:45080a648a13b1770cee0456cde79014d430e17d21def4a790041a15475350c2 +size 199058722 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cc1373e67ef8add56073a93ecfa3f53a12732288 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:329b4d3109f017aae5dfa2b197ccb5a9aa7830bc265c4baf3feb79e095cc7771 +size 199058658 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_88_mp_rank_01_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_88_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ced59b0f233d3162bf562592ccc007ac05aedd52 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_88_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:60808c1aaefe00442140011cd97e6d3c2458d4fa7615d3833e6bd089ae0c5cab +size 199058658 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e25a6c274a4924342841a9b7189d1850ea4f2066 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:907afa8c2c3349226d3f1d825f0b9ddcc93d21a8d4dfecdaee0008a84f5866c1 +size 199058658 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_89_mp_rank_01_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_89_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..653ac5a34ead517291eb38e245d47693de862ca2 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_89_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8696a0c00b7db9d48e4bc85531deae5cc41af7bf2c3e4eadf56ce835751151c6 +size 199058658 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7df7f5e6aebe1177fc89b63491fd1c1e4f08d353 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba88bfbdb1ad90898a1a9b5cb492ec3d298d5d8923ed5c55bb54d2e6dbda9b18 +size 199058647 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_8_mp_rank_01_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_8_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cd8c07999022b7c2c8bbd0286fe603b67795d65a --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_8_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bedc0070a82beda17667f268c0f7d0925272dafdd0402d8112b7aed1bbe9b7ab +size 199058647 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d1b3ffd84024ee5769809b354bde0b4568631119 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5da4483c29158bbfc601c34611f46f8ae1229892a0e735bf6e4629b568f70aaa +size 199058850 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_90_mp_rank_01_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_90_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6ee05c9e8606bfcfe6016f49c7ac4e58cabb4649 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_90_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7ec4b9a6ebe2e424e72f82537c00a241be344b1e47705067f0f1cdd241c6cd48 +size 199058850 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..13e93205a618eb5bcdd5a1106a775125f5e4398c --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ddb8c7c8d9dfc0a9e5eae4e1f984b5d08366a7bda3e3d2620046ebe3ff58b9f0 +size 199058722 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_91_mp_rank_01_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_91_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f7cd1cf46c3df592af8220052687c704129a7bbb --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_91_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a612348e10a1972db679ebc555e05dc0faea58ca60ec0acc00b26d97667267d5 +size 199058722 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ca3c314447799ebb83a31b0e5e1daa95509a411d --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:46a1d053493585eaca54ec29b95aaed62c996491c9be86d3d1aa34dc9e9315a6 +size 199058658 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_92_mp_rank_01_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_92_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a4362115f6860f2ae7b3ee98c3f5507f3ac31ce6 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_92_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d98e7a8e6d1ca673621db3d32525613f6f5c424e8acf5862907d02a289d21737 +size 199058658 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3cb05e5d9461586df32d405ad5778e5c8945e1f5 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f15bdcf63314ade7ff5ac14ffb03a34baca9865cd8ac264c727be1d0c92785e3 +size 199058786 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_93_mp_rank_01_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_93_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..24ee7b02e64b9723ee0b956ae6764d0621eaac57 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_93_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fee7c22225a714fc3f15fcebd8a546f5e8d2355640e3ad8c821acd42d84d8cf2 +size 199058786 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..71962e25db3e639430d496b06272d977fdfd4e28 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:010ac0543ba567a4b6e02acfa7bb78979f93aa65d86fcf8c7239cd26db72157a +size 199058722 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_94_mp_rank_01_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_94_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..19ac08a802d73edd7c002326eb311ebbf88bc37e --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_94_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b0db55bcb7a268534b92b997f97fd7499cd88a918b35c4c57c09303df5ca078 +size 199058722 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7f7e70c0d5b29abdd2c02263e013992364a18663 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2988c7312f991d624ddfb3814e3141198825634b916db52d11393370633019f0 +size 199058722 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_95_mp_rank_01_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_95_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4b5bfd84054da9b4fcc819b12001102c8264f4a2 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_95_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a83266cd02e57ac47a888c8bf141db97b66f8b99367ed33f697870a61b338ac1 +size 199058722 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ac8748507e1e5b221ca2ad0d096d3f55176018f4 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8220e72b7b51ffaf05b5422267a350327e4dfef05fd78ed7e92cd19a6602f500 +size 199058722 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_96_mp_rank_01_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_96_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9964670efd182214ff2a79c7f53f2c5020ff01ad --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_96_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:423ffc95956118d6fd695e205ab77a6272f2ab340f1843bab15057de859960be +size 199058722 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..23df9fcc55300631b341d194e28394b2760736f7 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b1e3559a0aba139bf54d7e3441bb692eac250f78f4788c9241065cec92da8b02 +size 199058786 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_97_mp_rank_01_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_97_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b8ed4e18ae4ec2c4beeef400bc84e1f63a88f6ae --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_97_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a27cf5c6ea0100280d247ce8a527a33885d8cfc73e5cc23ab8da8c9d9473285 +size 199058786 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3295badecb8f0c07dffe9da566449dc478deb8d7 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a6b7658ed194df54f6e4114f280d04b9c9a04d7f36540cc786448e0d67e86fcd +size 199058658 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_98_mp_rank_01_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_98_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cc9cbe42a9708499f06f8620be34c39476a81772 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_98_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:16a99a0585683d9596754d3682e58604071caa004f0dcdfbc300b7880bbe94c2 +size 199058658 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..07567b45b66abfdc4c6ba56e83a0cf93f31e9a05 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee8f1e612eced4e9254b7cd06a32ed1bc17167a69b067f5a67dcc8142e7231c8 +size 199058658 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_99_mp_rank_01_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_99_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a54efbc285e23c9f04e5a6effc3493920c09a0dd --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_99_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cfc8144d00872b3cdff246508e8c4b6989f10de5e2bbd627be53ad66dec92b02 +size 199058658 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e9613bb956de5058df032232121dafa1eb4edb47 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f4cf9a236c0222b46b6c3bb3883532cc6b4a5d1f3a38043b92375423dcc4e7a6 +size 199058839 diff --git a/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_9_mp_rank_01_optim_states.pt b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_9_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b452b0596b6828c8c28612d56deeff4ff0d9f749 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/bf16_zero_pp_rank_9_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0decb25550e74d6808e8b74f2d37a9b9f968ee59023127d6bc547b631b513e2f +size 199058839 diff --git a/4b284b84b10c4py/global_step80108/layer_01-model_00-model_states.pt b/4b284b84b10c4py/global_step80108/layer_01-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b87f708497f43f052b48ffa9d42f74a84b82c04f --- /dev/null +++ b/4b284b84b10c4py/global_step80108/layer_01-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:80cd41d257dad5a4b45ac594acafd7950a33ff279c79a7401ef1785c56dd6d61 +size 167511299 diff --git a/4b284b84b10c4py/global_step80108/layer_01-model_01-model_states.pt b/4b284b84b10c4py/global_step80108/layer_01-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9204b13acd5e29915938ecd9350b7fc641abf2b3 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/layer_01-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3f7e2b93ae9d57f25f2f31db1712a9fda7b514de4f25114f02aec1eeb3f3963f +size 167511299 diff --git a/4b284b84b10c4py/global_step80108/layer_03-model_00-model_states.pt b/4b284b84b10c4py/global_step80108/layer_03-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8776ce01915fe5c5a403b5d02a58145a746e26fa --- /dev/null +++ b/4b284b84b10c4py/global_step80108/layer_03-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a522122156f84abdaaf74906822f4ba4ba49dd0142deeb38a4085b68c6e209b9 +size 113308931 diff --git a/4b284b84b10c4py/global_step80108/layer_03-model_01-model_states.pt b/4b284b84b10c4py/global_step80108/layer_03-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..671b542f4ae3a96a4e66d42d838ac18c245728de --- /dev/null +++ b/4b284b84b10c4py/global_step80108/layer_03-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:62b818c2c2008c9f02946d57884601442011fbec1de6c5ddc44203b330ff2e9a +size 113308931 diff --git a/4b284b84b10c4py/global_step80108/layer_04-model_00-model_states.pt b/4b284b84b10c4py/global_step80108/layer_04-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a18a66e658f1be882fc05971c4799712b18f5ec3 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/layer_04-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cc407a2b7a7380d118eba5959143f2da404a43b11dfed404aa111d54db71c31e +size 113308931 diff --git a/4b284b84b10c4py/global_step80108/layer_04-model_01-model_states.pt b/4b284b84b10c4py/global_step80108/layer_04-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1f899d68c376de39fa227f6cf409da5c7659e17e --- /dev/null +++ b/4b284b84b10c4py/global_step80108/layer_04-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6976d3b60fcd43e89ef0f8f0ed85b22bb6483b48df8a14a6bcf8cd6e4c2809e8 +size 113308931 diff --git a/4b284b84b10c4py/global_step80108/layer_05-model_00-model_states.pt b/4b284b84b10c4py/global_step80108/layer_05-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c4026bc52022d10031c0af779cb9c2ab6252e3f9 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/layer_05-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d5235c64a3e1ca2e421543b2e50c07e1d8f5737bab41bbd0d1949d14c34e5650 +size 113308931 diff --git a/4b284b84b10c4py/global_step80108/layer_05-model_01-model_states.pt b/4b284b84b10c4py/global_step80108/layer_05-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..96c1926b9dc8e07a95991fc15a810b688a635a67 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/layer_05-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8567b9f4c22a77256469fa06f3ed7a6bdcb86fd9a05af4c91591282cd73d92f4 +size 113308931 diff --git a/4b284b84b10c4py/global_step80108/layer_06-model_00-model_states.pt b/4b284b84b10c4py/global_step80108/layer_06-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f21bf997252dda973b9e2866c97e8eefc99d14dc --- /dev/null +++ b/4b284b84b10c4py/global_step80108/layer_06-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6631ceee29be545333e54766de6541c38be4179ef684329d28148c1c6e6c46c0 +size 113308931 diff --git a/4b284b84b10c4py/global_step80108/layer_06-model_01-model_states.pt b/4b284b84b10c4py/global_step80108/layer_06-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dcd0db560fec5a35299dbd01ffe5f50b3d014732 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/layer_06-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3cd6c0ca4c8dfccf700989d60dbd27dea7f5a03af4100258859f926396cef30b +size 113308931 diff --git a/4b284b84b10c4py/global_step80108/layer_07-model_00-model_states.pt b/4b284b84b10c4py/global_step80108/layer_07-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c61a74f6c820ed6c05704ae3565ee4ccd6fc3db2 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/layer_07-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e559a9be51054c47773f922d3e026e32ca614517aa33f5dbba7b6441bbd25a4f +size 113308931 diff --git a/4b284b84b10c4py/global_step80108/layer_07-model_01-model_states.pt b/4b284b84b10c4py/global_step80108/layer_07-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9c81e1cfd3e9a876b1da5c49f8976a5add3c9114 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/layer_07-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e91fb5f938514260fdb3b794c5304a3f2c08fca93bba12a245a1620e4a926739 +size 113308931 diff --git a/4b284b84b10c4py/global_step80108/layer_08-model_00-model_states.pt b/4b284b84b10c4py/global_step80108/layer_08-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..282c57624ec6c219ac4df8e7f06950d5dc822da9 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/layer_08-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:46e0a44082b7deb8fad00ce000bf894d14897268b808d99244a5dd58ee8dcc72 +size 113308931 diff --git a/4b284b84b10c4py/global_step80108/layer_08-model_01-model_states.pt b/4b284b84b10c4py/global_step80108/layer_08-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c7045167f7f55b880b67527adf87ea67f7cfb138 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/layer_08-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:14999ff2bca6caf87e8d8e3eb9e0bd16b3000f576d6876a0f7c185b898166763 +size 113308931 diff --git a/4b284b84b10c4py/global_step80108/layer_09-model_00-model_states.pt b/4b284b84b10c4py/global_step80108/layer_09-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..86ea49546ad3a4aeb246f431894a7fc51320aaf4 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/layer_09-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0b8525ba98839702bec812c816883462848f4da93ee16c23f452309edb362688 +size 113308931 diff --git a/4b284b84b10c4py/global_step80108/layer_09-model_01-model_states.pt b/4b284b84b10c4py/global_step80108/layer_09-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1a61ce253fc8efbd4a0c5b29d82a20cd4e901c79 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/layer_09-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6e6565200c40a1ad352b94da82ec6da5d9cffb83cfc774160fe0c9052db16150 +size 113308931 diff --git a/4b284b84b10c4py/global_step80108/layer_10-model_00-model_states.pt b/4b284b84b10c4py/global_step80108/layer_10-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d1164e4f6fcf46165dc219390bc5a49cea9f912f --- /dev/null +++ b/4b284b84b10c4py/global_step80108/layer_10-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:03120c9d65071d04b3e4f283eb99957dd8a73e05b214384c1e58b6374f78b028 +size 113308931 diff --git a/4b284b84b10c4py/global_step80108/layer_10-model_01-model_states.pt b/4b284b84b10c4py/global_step80108/layer_10-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ff6ae12eea0b63c48b702a52bff23315e034b2e8 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/layer_10-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9badbc737ccfbde4a928ee2a08a778ade8befdb54c83cd264e33e66f70958091 +size 113308931 diff --git a/4b284b84b10c4py/global_step80108/layer_11-model_00-model_states.pt b/4b284b84b10c4py/global_step80108/layer_11-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5fbc74c7712a20f7f71c3409401e115ef980f519 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/layer_11-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e077b8c5778a7c354f0116a84188d12923316900467520e2704135165f329a31 +size 113308931 diff --git a/4b284b84b10c4py/global_step80108/layer_11-model_01-model_states.pt b/4b284b84b10c4py/global_step80108/layer_11-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b317eebfb92c902b69423910ff13db66a7d7ad04 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/layer_11-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d736febe748fd61efba158dc261be715208c08b51ce854b738385deffe2a4e98 +size 113308931 diff --git a/4b284b84b10c4py/global_step80108/layer_12-model_00-model_states.pt b/4b284b84b10c4py/global_step80108/layer_12-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b00e291d6748bef9bf0869cb6b73dee3a38a2dd3 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/layer_12-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:07d5bbb4244bb8bb1048c4e7d7913693cad24f5d1631138fc151ed9fb94208bc +size 113308931 diff --git a/4b284b84b10c4py/global_step80108/layer_12-model_01-model_states.pt b/4b284b84b10c4py/global_step80108/layer_12-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..454cf0eeaefe935d5335df1f9bf289b716742ae6 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/layer_12-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c41c962b2395aa73b2e0f13354e0d5a44e366e70bacf0c392ff204b22f1a6afd +size 113308931 diff --git a/4b284b84b10c4py/global_step80108/layer_13-model_00-model_states.pt b/4b284b84b10c4py/global_step80108/layer_13-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7a766e85b4862ff6434c89c7402525212687d163 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/layer_13-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:15979e9eca01a61bb78ac3b3fa5c3a81972bcdb71c2eac3fd423d002592217b3 +size 113308931 diff --git a/4b284b84b10c4py/global_step80108/layer_13-model_01-model_states.pt b/4b284b84b10c4py/global_step80108/layer_13-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..682de2443c91bb103a79e579b3d6043c74f90896 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/layer_13-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:12bbb682a025ce1199ac502c5e738975cfb73d01b8a436df4245674aefc03942 +size 113308931 diff --git a/4b284b84b10c4py/global_step80108/layer_14-model_00-model_states.pt b/4b284b84b10c4py/global_step80108/layer_14-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..66d82626991a34d0837cb91c2e63637ab9bf5f63 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/layer_14-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b47a013c2de20d4af5db55ed6b6c1dad256947309621ff6bacfb85a5da2e8c39 +size 113308931 diff --git a/4b284b84b10c4py/global_step80108/layer_14-model_01-model_states.pt b/4b284b84b10c4py/global_step80108/layer_14-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3d34c592f076288050eea8cb80023ba7193aee55 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/layer_14-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:03fcafbdad5d58701fa187686b4170a0219c62c9a91e5dc94eabbbd153c55eed +size 113308931 diff --git a/4b284b84b10c4py/global_step80108/layer_15-model_00-model_states.pt b/4b284b84b10c4py/global_step80108/layer_15-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6d09fb0292d8b88d80082a913bf9e782e309b1af --- /dev/null +++ b/4b284b84b10c4py/global_step80108/layer_15-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3bdac4abad17292294b687fecc7da51419e087eedf061ff6837953de317492e0 +size 113308931 diff --git a/4b284b84b10c4py/global_step80108/layer_15-model_01-model_states.pt b/4b284b84b10c4py/global_step80108/layer_15-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..38d526bdca42e0135c2bf7e58a761fe9d1f47d6c --- /dev/null +++ b/4b284b84b10c4py/global_step80108/layer_15-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1d3195cb0ac91900f6723a9e099dca8af3effd76d3c8819965ff140318a05111 +size 113308931 diff --git a/4b284b84b10c4py/global_step80108/layer_16-model_00-model_states.pt b/4b284b84b10c4py/global_step80108/layer_16-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a0fce4ebf5f57cf9286d4d8ee66dfdce212492fb --- /dev/null +++ b/4b284b84b10c4py/global_step80108/layer_16-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e5145f474af86873cb269b3e78ccf55c37b6342030135f5a8752f953a24920cf +size 113308931 diff --git a/4b284b84b10c4py/global_step80108/layer_16-model_01-model_states.pt b/4b284b84b10c4py/global_step80108/layer_16-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..14e5c2431b99881f91c9e692407c5a8ecb6df9db --- /dev/null +++ b/4b284b84b10c4py/global_step80108/layer_16-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d762cfb010c364674686779f6f2b69ba4b27cad62b08706ea59f8d3ee6a51658 +size 113308931 diff --git a/4b284b84b10c4py/global_step80108/layer_17-model_00-model_states.pt b/4b284b84b10c4py/global_step80108/layer_17-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a10b8e8a6164330557761b71ab385d2c4c1ce06a --- /dev/null +++ b/4b284b84b10c4py/global_step80108/layer_17-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:793bfcbcd714bffb039fa800d8a37d71e9d0c659f01ba9158d3929c950533566 +size 113308931 diff --git a/4b284b84b10c4py/global_step80108/layer_17-model_01-model_states.pt b/4b284b84b10c4py/global_step80108/layer_17-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6dd425d24e396770e5add2d26d5a3fd814fd7c41 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/layer_17-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3fb6189f3597272ed3c70e87a53488ff82eaabb58c625b43a1e5ed0cde5968be +size 113308931 diff --git a/4b284b84b10c4py/global_step80108/layer_18-model_00-model_states.pt b/4b284b84b10c4py/global_step80108/layer_18-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b3daf52a8074b9cbe0826c4667104eaccdd405f9 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/layer_18-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:66d28d6d90ee1388e96557783fd98d928b301e20007e319876b729dd4ae679cb +size 113308931 diff --git a/4b284b84b10c4py/global_step80108/layer_18-model_01-model_states.pt b/4b284b84b10c4py/global_step80108/layer_18-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d6a2e3d1978278f8bb90ddf8f7d3f082943f0a52 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/layer_18-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ae81faac496ad6b966cd0dd1438484f5e5dcf0e5e1ef436c80245f91202a28b +size 113308931 diff --git a/4b284b84b10c4py/global_step80108/layer_19-model_00-model_states.pt b/4b284b84b10c4py/global_step80108/layer_19-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e733779cf8b81d01a6486beb4aa01859715eb2ab --- /dev/null +++ b/4b284b84b10c4py/global_step80108/layer_19-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b997f3655406d6f4d29b72725b18ce276cc4194ebde6985983d296ca90674341 +size 113308931 diff --git a/4b284b84b10c4py/global_step80108/layer_19-model_01-model_states.pt b/4b284b84b10c4py/global_step80108/layer_19-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5b29bd5302daa57c1502d1780a6edcfb417ce3c2 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/layer_19-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:692bd7c29ba2fd0e6833d27084e09ddb1e6acadad66c76120d9185c971e5f99e +size 113308931 diff --git a/4b284b84b10c4py/global_step80108/layer_20-model_00-model_states.pt b/4b284b84b10c4py/global_step80108/layer_20-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f1ae2a1646f7e9d090bd7ff3a4989770ac7ca88b --- /dev/null +++ b/4b284b84b10c4py/global_step80108/layer_20-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:59571e1acfb94fbbf9b086f4d35ac0fcd1f76367eb194cffa4e8b2aa42fb033f +size 113308931 diff --git a/4b284b84b10c4py/global_step80108/layer_20-model_01-model_states.pt b/4b284b84b10c4py/global_step80108/layer_20-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c86b9d097c324420f6659142e92eee62cf3ca375 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/layer_20-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4361a28a91f052345d15687af96b6dd445fd71e68a443afd39f6d801e6c057fb +size 113308931 diff --git a/4b284b84b10c4py/global_step80108/layer_21-model_00-model_states.pt b/4b284b84b10c4py/global_step80108/layer_21-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ef38d1e11fd7a8786438b7b65242f2e50823f6d8 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/layer_21-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c6f9f6ec83c82f3057f5aaef51ac83fbcadec3a36ca9d94c3a1128850cbe085 +size 113308931 diff --git a/4b284b84b10c4py/global_step80108/layer_21-model_01-model_states.pt b/4b284b84b10c4py/global_step80108/layer_21-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7f264ee16b54f07d177e67b636241c2563073155 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/layer_21-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:86ea3f6fd83484a421602fa92b11361d982470f527dc5bb0e66fce9c05fba9f7 +size 113308931 diff --git a/4b284b84b10c4py/global_step80108/layer_22-model_00-model_states.pt b/4b284b84b10c4py/global_step80108/layer_22-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e3493a612be526ba724544a7249576f37bada360 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/layer_22-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:15f819c50d4fdbcc83551ccf651fc3adce6822eb66d7c8a328194514e0eaf0df +size 113308931 diff --git a/4b284b84b10c4py/global_step80108/layer_22-model_01-model_states.pt b/4b284b84b10c4py/global_step80108/layer_22-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0ec9beb6dc705884f92ef87edebce69da72b10a8 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/layer_22-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5ae964f96eec8e16e81722e509c7db9001e0700a46ffd98d9798b33ab47f5197 +size 113308931 diff --git a/4b284b84b10c4py/global_step80108/layer_23-model_00-model_states.pt b/4b284b84b10c4py/global_step80108/layer_23-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4ba154333f6686c879248141f2abf237b4f2f1ec --- /dev/null +++ b/4b284b84b10c4py/global_step80108/layer_23-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5422e956b2beffe93f376079a414d9ee99ca84ee42ce5d1f4ffc75c6aeddbc77 +size 113308931 diff --git a/4b284b84b10c4py/global_step80108/layer_23-model_01-model_states.pt b/4b284b84b10c4py/global_step80108/layer_23-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d2c488bc215a7a06fe63a7e49fb54e3d65767725 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/layer_23-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:920bf5938c0fbb9b381493cfe6c047dab9dae9dd84d9bf648d88c62bb2bb1823 +size 113308931 diff --git a/4b284b84b10c4py/global_step80108/layer_24-model_00-model_states.pt b/4b284b84b10c4py/global_step80108/layer_24-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e0a42a534845b18511ecefd8314f22cd9668a7ea --- /dev/null +++ b/4b284b84b10c4py/global_step80108/layer_24-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a68601c806d53c479db3f37cb84601a9898802d4be29cc103d4d2f2af909b8f0 +size 113308931 diff --git a/4b284b84b10c4py/global_step80108/layer_24-model_01-model_states.pt b/4b284b84b10c4py/global_step80108/layer_24-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2d8cec85272a6526cafd3c4b6efaf1eaca2a4538 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/layer_24-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:725e0f37eb6ac840e0301e18661ef38e49d12b1662c10a8026037250664a216d +size 113308931 diff --git a/4b284b84b10c4py/global_step80108/layer_25-model_00-model_states.pt b/4b284b84b10c4py/global_step80108/layer_25-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a0381d6447a747e6d5ae5bec199d0b6e61184170 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/layer_25-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:083f86745fb3abf6c6578327a5cd9395819d0921dbc7d7d5feb2329354ff798c +size 113308931 diff --git a/4b284b84b10c4py/global_step80108/layer_25-model_01-model_states.pt b/4b284b84b10c4py/global_step80108/layer_25-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..77299b7e3208ff2014a832e98e57c6c2296f5597 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/layer_25-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6931f7c70a702903207bad2b2a6c31f798d31ec5be7ab7d687beb8702502ca0b +size 113308931 diff --git a/4b284b84b10c4py/global_step80108/layer_26-model_00-model_states.pt b/4b284b84b10c4py/global_step80108/layer_26-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dd7056c60887dd1356938a2a3b28864c692f8e81 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/layer_26-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:01de20365d978864225fde3b97dd355f77880626727b5faabe9f22e8f9c3ae67 +size 113308931 diff --git a/4b284b84b10c4py/global_step80108/layer_26-model_01-model_states.pt b/4b284b84b10c4py/global_step80108/layer_26-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..17db58882e0d38d53d899a84d62dac808b740497 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/layer_26-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1de552b68459334f859c149d18ba56e4e0b436142987c0cb57a3434ab226d567 +size 113308931 diff --git a/4b284b84b10c4py/global_step80108/layer_27-model_00-model_states.pt b/4b284b84b10c4py/global_step80108/layer_27-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7496551fc1d356827928e496abae3d756a23fbfd --- /dev/null +++ b/4b284b84b10c4py/global_step80108/layer_27-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:06793a1a1041f98811aebd049c990006d9d48a05be898733279ed4d7c14035cd +size 113308931 diff --git a/4b284b84b10c4py/global_step80108/layer_27-model_01-model_states.pt b/4b284b84b10c4py/global_step80108/layer_27-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ab6581f7614c6600702968beb87d7dd28fb6054b --- /dev/null +++ b/4b284b84b10c4py/global_step80108/layer_27-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:65538a1cfe61cd0a1a97c3218bb9689b014e13380e9c4ea5936e6df84c1c8038 +size 113308931 diff --git a/4b284b84b10c4py/global_step80108/layer_28-model_00-model_states.pt b/4b284b84b10c4py/global_step80108/layer_28-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..36eef05c77319b47fc9cf11037d95f2d01dc57cc --- /dev/null +++ b/4b284b84b10c4py/global_step80108/layer_28-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ce16fbcc44443093247696759ae42d1246413f0c299ece346a271b37d5ccc39a +size 113308931 diff --git a/4b284b84b10c4py/global_step80108/layer_28-model_01-model_states.pt b/4b284b84b10c4py/global_step80108/layer_28-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..73511067193ca3773e17b020331d61877c8f9d58 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/layer_28-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:87fbcf4ce3cbfabe87a926726e0c63ea75a39a50a1839b649f6589fabb67e2b2 +size 113308931 diff --git a/4b284b84b10c4py/global_step80108/layer_29-model_00-model_states.pt b/4b284b84b10c4py/global_step80108/layer_29-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b37364dbcd6c15658208bb8b88e9f435fc02fbd1 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/layer_29-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:67fb9f9ca16ecc5bd9b182a61a712e4ea24919c9d379cc1cfc7816363c6be548 +size 113308931 diff --git a/4b284b84b10c4py/global_step80108/layer_29-model_01-model_states.pt b/4b284b84b10c4py/global_step80108/layer_29-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2d99ff9f0cce0a12c84191f5c1e2ea1207c2c210 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/layer_29-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:18087cbce6b7d55cb1b03a68925cb05d67827042b9779b26f306cb3f12c29de4 +size 113308931 diff --git a/4b284b84b10c4py/global_step80108/layer_30-model_00-model_states.pt b/4b284b84b10c4py/global_step80108/layer_30-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..332481fcc1353331e4ed4fb668c43e905d98dfbf --- /dev/null +++ b/4b284b84b10c4py/global_step80108/layer_30-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1c175ec5b12b66e22944221b18c8e45399a12eeabe018e521c9ff7c2680c393d +size 113308931 diff --git a/4b284b84b10c4py/global_step80108/layer_30-model_01-model_states.pt b/4b284b84b10c4py/global_step80108/layer_30-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6b9923bd3c332f6607993fe5fb2f33476c8ac381 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/layer_30-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f4b0b71d096f7035e7cf2544d2b59d8747d6d0d7df8e89ae3decce81f992e461 +size 113308931 diff --git a/4b284b84b10c4py/global_step80108/layer_31-model_00-model_states.pt b/4b284b84b10c4py/global_step80108/layer_31-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8e9a5e563bb1782baedcda369fe13bc1d03de23a --- /dev/null +++ b/4b284b84b10c4py/global_step80108/layer_31-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba9af6af70a2b2611db9d9e9aac0e7c0bc1d21b8f9602fc7b57cdcc65b3e3f0e +size 113308931 diff --git a/4b284b84b10c4py/global_step80108/layer_31-model_01-model_states.pt b/4b284b84b10c4py/global_step80108/layer_31-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..95a7419214ab61ce4a08e3bc87a9e0b4b9016ced --- /dev/null +++ b/4b284b84b10c4py/global_step80108/layer_31-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e1a78bc01b1a21ba522d0ac6b88f5eebdf2fac4bd1f78e4f132d0e94a0f69c84 +size 113308931 diff --git a/4b284b84b10c4py/global_step80108/layer_32-model_00-model_states.pt b/4b284b84b10c4py/global_step80108/layer_32-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2182a468671b2d79586898353de5567cf6cac0b6 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/layer_32-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:84140cf0c37adc1e714d8a7f79c2576d638ba567024ac865f596b40ca3bc9445 +size 113308931 diff --git a/4b284b84b10c4py/global_step80108/layer_32-model_01-model_states.pt b/4b284b84b10c4py/global_step80108/layer_32-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..186f701fa9a0c842a16f0e0a735096e7869fc597 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/layer_32-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:226de305d47c31479a0a3177dfc289854f873fef5c9c56e07af782165da46769 +size 113308931 diff --git a/4b284b84b10c4py/global_step80108/layer_33-model_00-model_states.pt b/4b284b84b10c4py/global_step80108/layer_33-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e2a36a72dda4bd1bd1aeb27e6eb9ce4f85477d0f --- /dev/null +++ b/4b284b84b10c4py/global_step80108/layer_33-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:27521004612888b440990700b8ae94a131688057b01941e5f8944d73e46cc455 +size 113308931 diff --git a/4b284b84b10c4py/global_step80108/layer_33-model_01-model_states.pt b/4b284b84b10c4py/global_step80108/layer_33-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5ace7ebd8996ec6408f20a9f056a5efe488efb6f --- /dev/null +++ b/4b284b84b10c4py/global_step80108/layer_33-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:72e5691396e2e88ef6bf041ce537b723c28e8de6fa788cd38b09427e4f47e7a1 +size 113308931 diff --git a/4b284b84b10c4py/global_step80108/layer_34-model_00-model_states.pt b/4b284b84b10c4py/global_step80108/layer_34-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7d3a29d6413ef84cde89d8ceecabd1b3d8e9c3f6 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/layer_34-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c9a6c4805b2a953f4652e8d768c504d1d95cb8227686a0b0f0704c73d48136f1 +size 113308931 diff --git a/4b284b84b10c4py/global_step80108/layer_34-model_01-model_states.pt b/4b284b84b10c4py/global_step80108/layer_34-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b00b19bcdc079786962d9b86bac08dfda98365e7 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/layer_34-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bba236dc4d67569a1d461531455ab178ce76ce0b1ac74405329f73b6355eb13f +size 113308931 diff --git a/4b284b84b10c4py/global_step80108/layer_35-model_00-model_states.pt b/4b284b84b10c4py/global_step80108/layer_35-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8265c1aa72e2f09d1f391ea75ca1a5a9ba165a0e --- /dev/null +++ b/4b284b84b10c4py/global_step80108/layer_35-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7d41c3cd59c8b9e88965d5d7794e8c43ed40eb3576f44e0d8865260042b44c6f +size 113308931 diff --git a/4b284b84b10c4py/global_step80108/layer_35-model_01-model_states.pt b/4b284b84b10c4py/global_step80108/layer_35-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bf034e9b2b7ac00141592def1d9182f5e9c0b82e --- /dev/null +++ b/4b284b84b10c4py/global_step80108/layer_35-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2c1f71df940997caf68fbdf01048b4a16c2010b185fcb66c6fc7c9f57e25b57d +size 113308931 diff --git a/4b284b84b10c4py/global_step80108/layer_36-model_00-model_states.pt b/4b284b84b10c4py/global_step80108/layer_36-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..63a9affea7f144f37c56ad976cb08b4e74a20373 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/layer_36-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e7d103b8ed1d147c227c0fea0acc9679eb068318c81ce04d286cce6aff0fa57 +size 113308931 diff --git a/4b284b84b10c4py/global_step80108/layer_36-model_01-model_states.pt b/4b284b84b10c4py/global_step80108/layer_36-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ddbee899e5ef83bf63b7d8420429aa31a02f3fe1 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/layer_36-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f9e3c5d0a9006e5f3b57c04e7738d731f59a4160d2f42f79fbd7e061130c2b87 +size 113308931 diff --git a/4b284b84b10c4py/global_step80108/layer_37-model_00-model_states.pt b/4b284b84b10c4py/global_step80108/layer_37-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..caa9e1a95bdd9ae77dda591929484360df3890ef --- /dev/null +++ b/4b284b84b10c4py/global_step80108/layer_37-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a4e57cd64529f68f3398e4fa47ffacdfe161a854fecd0431cbab0c13afa8c85 +size 113308931 diff --git a/4b284b84b10c4py/global_step80108/layer_37-model_01-model_states.pt b/4b284b84b10c4py/global_step80108/layer_37-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..74876f8819b987a1dae3a874a84ab186654e0e9a --- /dev/null +++ b/4b284b84b10c4py/global_step80108/layer_37-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f9ac1475c911b77f735f41a47fbfb52c105d482a0bf1a38cf4457727d55bb19f +size 113308931 diff --git a/4b284b84b10c4py/global_step80108/layer_38-model_00-model_states.pt b/4b284b84b10c4py/global_step80108/layer_38-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4fefed0894ee086ef75262ce744e46a15fc53f66 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/layer_38-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0def9575927e6047c6c22457a8b43f375ba0b1113c5474bbc117aa1c76b03e92 +size 113308931 diff --git a/4b284b84b10c4py/global_step80108/layer_38-model_01-model_states.pt b/4b284b84b10c4py/global_step80108/layer_38-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f2af0b545ddba49a3a5557a4c3a3cf1d134afd5f --- /dev/null +++ b/4b284b84b10c4py/global_step80108/layer_38-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dcb7467079f90d1e6f3a55a490d58fdcac3aa2dc418e39626d51175a61019766 +size 113308931 diff --git a/4b284b84b10c4py/global_step80108/layer_40-model_00-model_states.pt b/4b284b84b10c4py/global_step80108/layer_40-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bcd6a3959e5cdcad54af17d04faa70b5142bc88f --- /dev/null +++ b/4b284b84b10c4py/global_step80108/layer_40-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a29e3e4efb21ceb966dcc6535619fcd302b9cc188f33d3957dfdca7eba212aaf +size 13507 diff --git a/4b284b84b10c4py/global_step80108/layer_40-model_01-model_states.pt b/4b284b84b10c4py/global_step80108/layer_40-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..effce2dda4214d0e03ae7edacd1fc6a66052c275 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/layer_40-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1fbbd9d2b53e74c3c5e33e44c775c355779661298ef9b1b781d820cfeeaa6e28 +size 13507 diff --git a/4b284b84b10c4py/global_step80108/mp_rank_00_model_states.pt b/4b284b84b10c4py/global_step80108/mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8eb21fa62f2912c61a7d867129429ea063b2bcf1 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f3b9202ce9b3a4f0acf2c9c85946c24536ba36cfeeb6c40300f75aff6fecead6 +size 51827 diff --git a/4b284b84b10c4py/global_step80108/mp_rank_01_model_states.pt b/4b284b84b10c4py/global_step80108/mp_rank_01_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..77dc5638e5ec9d79d954d4ba9f051fa5ccfd72c2 --- /dev/null +++ b/4b284b84b10c4py/global_step80108/mp_rank_01_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:531fb6c34da7c3042398bc9bc35b38d7e5a1f7dea460d77fbc10a064a2ae0cd0 +size 51827 diff --git a/4b284b84b10c4py/transformers/config.json b/4b284b84b10c4py/transformers/config.json new file mode 100644 index 0000000000000000000000000000000000000000..df814c3a71ee49044410636b5eeb4f43611690ba --- /dev/null +++ b/4b284b84b10c4py/transformers/config.json @@ -0,0 +1 @@ +{"vocab_size": 50432, "n_positions": 2048, "n_embd": 3072, "n_layer": 36, "n_head": 24, "n_inner": 12288, "activation_function": "gelu", "resid_pdrop": 0.1, "embd_pdrop": 0.1, "attn_pdrop": 0.1, "layer_norm_epsilon": 1e-05, "initializer_range": 0.02, "summary_type": "cls_index", "summary_use_proj": true, "summary_activation": null, "summary_first_dropout": 0.1, "summary_proj_to_labels": true, "scale_attn_weights": true, "use_cache": true, "scale_attn_by_inverse_layer_idx": false, "reorder_and_upcast_attn": false, "bos_token_id": 50256, "eos_token_id": 50256, "return_dict": true, "output_hidden_states": false, "output_attentions": false, "torchscript": false, "torch_dtype": null, "use_bfloat16": false, "tf_legacy_loss": false, "pruned_heads": {}, "tie_word_embeddings": true, "is_encoder_decoder": false, "is_decoder": false, "cross_attention_hidden_size": null, "add_cross_attention": false, "tie_encoder_decoder": false, "max_length": 20, "min_length": 0, "do_sample": false, "early_stopping": false, "num_beams": 1, "num_beam_groups": 1, "diversity_penalty": 0.0, "temperature": 1.0, "top_k": 50, "top_p": 1.0, "typical_p": 1.0, "repetition_penalty": 1.0, "length_penalty": 1.0, "no_repeat_ngram_size": 0, "encoder_no_repeat_ngram_size": 0, "bad_words_ids": null, "num_return_sequences": 1, "chunk_size_feed_forward": 0, "output_scores": false, "return_dict_in_generate": false, "forced_bos_token_id": null, "forced_eos_token_id": null, "remove_invalid_values": false, "exponential_decay_length_penalty": null, "suppress_tokens": null, "begin_suppress_tokens": null, "architectures": ["GPT2LMHeadModel"], "finetuning_task": null, "id2label": {"0": "LABEL_0", "1": "LABEL_1"}, "label2id": {"LABEL_0": 0, "LABEL_1": 1}, "tokenizer_class": null, "prefix": null, "pad_token_id": null, "sep_token_id": null, "decoder_start_token_id": null, "task_specific_params": null, "problem_type": null, "_name_or_path": "", "transformers_version": "4.25.0.dev0", "n_ctx": 1024, "gradient_checkpointing": false, "model_type": "gpt2"} \ No newline at end of file diff --git a/4b284b84b10c4py/transformers/merges.txt b/4b284b84b10c4py/transformers/merges.txt new file mode 100644 index 0000000000000000000000000000000000000000..cf4316427cc294a1140f596959a470a42fffa4d3 --- /dev/null +++ b/4b284b84b10c4py/transformers/merges.txt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ce1664773c50f3e0cc8842619a93edc4624525b728b188a9e0be33b7726adc5 +size 456318 diff --git a/4b284b84b10c4py/transformers/pytorch_model.bin b/4b284b84b10c4py/transformers/pytorch_model.bin new file mode 100644 index 0000000000000000000000000000000000000000..1ccd988d1add608a2901964fcb0d73ade63ca819 --- /dev/null +++ b/4b284b84b10c4py/transformers/pytorch_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6c5d39183788c38e4bb7b3e78850ecfc428d65524f1f4fcf07e1fcce57c838d0 +size 8781203669 diff --git a/4b284b84b10c4py/transformers/tokenizer.json b/4b284b84b10c4py/transformers/tokenizer.json new file mode 100644 index 0000000000000000000000000000000000000000..0e99b0c1456fad7cbb09e6545c77cd19dc04f25e --- /dev/null +++ b/4b284b84b10c4py/transformers/tokenizer.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8414cab924d8b9b33013f0d221c5862f365ee9be39c5c2bfae8a5a9e970478a6 +size 1355256 diff --git a/4b284b84b10c4py/transformers/vocab.json b/4b284b84b10c4py/transformers/vocab.json new file mode 100644 index 0000000000000000000000000000000000000000..27c8a6dc955d9c5dd9d6fe5afb9a3d2d17865485 --- /dev/null +++ b/4b284b84b10c4py/transformers/vocab.json @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:196139668be63f3b5d6574427317ae82f612a97c5d1cdaf36ed2256dbf636783 +size 1042301