diff --git a/.gitattributes b/.gitattributes index 330e2dd2a7718d2117be1952cb03d8c549c542ac..e5db51ca52b64ac21199b285f1dd2d70183024bf 100644 --- a/.gitattributes +++ b/.gitattributes @@ -704,3 +704,195 @@ saved_model/**/* filter=lfs diff=lfs merge=lfs -text 4b284b42bc4seed2/evaluation/generation/examples.4b284b42bc4seed2_GEM-wiki_lingua_en_tldr_en_1.jsonl filter=lfs diff=lfs merge=lfs -text 4b284b17bc4seed3/evaluation/generation/examples.4b284b17bc4seed3_gem_xsum_article_DOC_summary_1.jsonl filter=lfs diff=lfs merge=lfs -text 4b284b42bc4seed2/evaluation/generation/examples.4b284b42bc4seed2_gem_xsum_article_DOC_summary_2.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b6bc4seed1/evaluation/generation/examples.4b284b6bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b6bc4seed3/evaluation/generation/examples.4b284b6bc4seed3_gem_xsum_article_DOC_summary_0.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b6bc4seed4/evaluation/generation/examples.4b284b6bc4seed4_GEM-wiki_lingua_en_tldr_en_0.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b1b9c4seed2/evaluation/generation/examples.4b284b1b9c4seed2_GEM-wiki_lingua_en_tldr_en_0.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b1b9c4seed3/evaluation/generation/examples.4b284b1b9c4seed3_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b1b9c4seed3/evaluation/generation/examples.4b284b1b9c4seed3_GEM-wiki_lingua_en_tldr_en_5.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b1b9c4seed4/evaluation/generation/examples.4b284b1b9c4seed4_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b6bc4seed2/evaluation/generation/examples.4b284b6bc4seed2_GEM-wiki_lingua_en_tldr_en_3.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b6bc4seed4/evaluation/generation/examples.4b284b6bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b1b9c4seed2/evaluation/generation/examples.4b284b1b9c4seed2_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b1b9c4seed2/evaluation/generation/examples.4b284b1b9c4seed2_gem_xsum_article_DOC_summary_0.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b6bc4seed1/evaluation/generation/examples.4b284b6bc4seed1_GEM-web_nlg_en_PALM_prompt_1.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b6bc4seed1/evaluation/generation/examples.4b284b6bc4seed1_GEM-wiki_lingua_en_tldr_en_5.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b1b9c4seed2/evaluation/generation/examples.4b284b1b9c4seed2_GEM-web_nlg_en_PALM_prompt_2.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b1b9c4seed2/evaluation/generation/examples.4b284b1b9c4seed2_GEM-wiki_lingua_en_tldr_en_3.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b1b9c4seed4/evaluation/generation/examples.4b284b1b9c4seed4_gem_xsum_article_DOC_summary_3.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b6bc4seed4/evaluation/generation/examples.4b284b6bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b6bc4seed4/evaluation/generation/examples.4b284b6bc4seed4_GEM-wiki_lingua_en_tldr_en_4.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b6bc4seed4/evaluation/generation/examples.4b284b6bc4seed4_gem_xsum_article_DOC_summary_2.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b6bc4seed4/evaluation/generation/examples.4b284b6bc4seed4_gem_xsum_article_DOC_summary_3.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b1b9c4seed4/evaluation/generation/examples.4b284b1b9c4seed4_GEM-wiki_lingua_en_tldr_en_5.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b6bc4seed3/evaluation/generation/examples.4b284b6bc4seed3_GEM-wiki_lingua_en_tldr_en_3.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b6bc4seed4/evaluation/generation/examples.4b284b6bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b6bc4seed4/evaluation/generation/examples.4b284b6bc4seed4_GEM-web_nlg_en_PALM_prompt_2.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b1b9c4seed2/evaluation/generation/examples.4b284b1b9c4seed2_GEM-web_nlg_en_PALM_prompt_3.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b6bc4seed2/evaluation/generation/examples.4b284b6bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b6bc4seed2/evaluation/generation/examples.4b284b6bc4seed2_gem_xsum_article_DOC_summary_5.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b6bc4seed3/evaluation/generation/examples.4b284b6bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b1b9c4seed1/evaluation/generation/examples.4b284b1b9c4seed1_GEM-web_nlg_en_PALM_prompt_1.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b1b9c4seed2/evaluation/generation/examples.4b284b1b9c4seed2_GEM-web_nlg_en_PALM_prompt_0.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b1b9c4seed3/evaluation/generation/examples.4b284b1b9c4seed3_GEM-wiki_lingua_en_tldr_en_1.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b6bc4seed1/evaluation/generation/examples.4b284b6bc4seed1_GEM-web_nlg_en_PALM_prompt_4.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b1b9c4seed4/evaluation/generation/examples.4b284b1b9c4seed4_GEM-wiki_lingua_en_tldr_en_1.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b6bc4seed2/evaluation/generation/examples.4b284b6bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b1b9c4seed1/evaluation/generation/examples.4b284b1b9c4seed1_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b1b9c4seed1/evaluation/generation/examples.4b284b1b9c4seed1_gem_xsum_article_DOC_summary_4.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b1b9c4seed4/evaluation/generation/examples.4b284b1b9c4seed4_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b1b9c4seed4/evaluation/generation/examples.4b284b1b9c4seed4_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b1b9c4seed3/evaluation/generation/examples.4b284b1b9c4seed3_gem_xsum_article_DOC_summary_0.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b6bc4seed1/evaluation/generation/examples.4b284b6bc4seed1_gem_xsum_article_DOC_summary_1.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b6bc4seed2/evaluation/generation/examples.4b284b6bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b6bc4seed2/evaluation/generation/examples.4b284b6bc4seed2_gem_xsum_article_DOC_summary_4.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b1b9c4seed4/evaluation/generation/examples.4b284b1b9c4seed4_GEM-web_nlg_en_PALM_prompt_2.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b1b9c4seed4/evaluation/generation/examples.4b284b1b9c4seed4_GEM-wiki_lingua_en_tldr_en_3.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b6bc4seed3/evaluation/generation/examples.4b284b6bc4seed3_GEM-web_nlg_en_PALM_prompt_4.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b6bc4seed4/evaluation/generation/examples.4b284b6bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b6bc4seed1/evaluation/generation/examples.4b284b6bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b6bc4seed4/evaluation/generation/examples.4b284b6bc4seed4_gem_xsum_article_DOC_summary_4.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b1b9c4seed2/evaluation/generation/examples.4b284b1b9c4seed2_GEM-wiki_lingua_en_tldr_en_5.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b1b9c4seed3/evaluation/generation/examples.4b284b1b9c4seed3_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b1b9c4seed3/evaluation/generation/examples.4b284b1b9c4seed3_GEM-wiki_lingua_en_tldr_en_0.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b1b9c4seed4/evaluation/generation/examples.4b284b1b9c4seed4_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b1b9c4seed4/evaluation/generation/examples.4b284b1b9c4seed4_GEM-wiki_lingua_en_tldr_en_0.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b6bc4seed1/evaluation/generation/examples.4b284b6bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b6bc4seed2/evaluation/generation/examples.4b284b6bc4seed2_GEM-web_nlg_en_PALM_prompt_4.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b6bc4seed3/evaluation/generation/examples.4b284b6bc4seed3_gem_xsum_article_DOC_summary_1.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b1b9c4seed1/evaluation/generation/examples.4b284b1b9c4seed1_GEM-web_nlg_en_PALM_prompt_5.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b1b9c4seed1/evaluation/generation/examples.4b284b1b9c4seed1_GEM-wiki_lingua_en_tldr_en_4.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b1b9c4seed2/evaluation/generation/examples.4b284b1b9c4seed2_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b1b9c4seed2/evaluation/generation/examples.4b284b1b9c4seed2_gem_xsum_article_DOC_summary_4.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b6bc4seed4/evaluation/generation/examples.4b284b6bc4seed4_GEM-web_nlg_en_PALM_prompt_3.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b6bc4seed4/evaluation/generation/examples.4b284b6bc4seed4_gem_xsum_article_DOC_summary_5.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b1b9c4seed4/evaluation/generation/examples.4b284b1b9c4seed4_gem_xsum_article_DOC_summary_2.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b1b9c4seed4/evaluation/generation/examples.4b284b1b9c4seed4_gem_xsum_article_DOC_summary_5.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b6bc4seed1/evaluation/generation/examples.4b284b6bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b6bc4seed3/evaluation/generation/examples.4b284b6bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b1b9c4seed1/evaluation/generation/examples.4b284b1b9c4seed1_GEM-web_nlg_en_PALM_prompt_4.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b1b9c4seed3/evaluation/generation/examples.4b284b1b9c4seed3_GEM-web_nlg_en_PALM_prompt_2.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b1b9c4seed3/evaluation/generation/examples.4b284b1b9c4seed3_GEM-wiki_lingua_en_tldr_en_3.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b1b9c4seed4/evaluation/generation/examples.4b284b1b9c4seed4_gem_xsum_article_DOC_summary_1.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b6bc4seed4/evaluation/generation/examples.4b284b6bc4seed4_GEM-wiki_lingua_en_tldr_en_2.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b6bc4seed1/evaluation/generation/examples.4b284b6bc4seed1_GEM-wiki_lingua_en_tldr_en_2.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b6bc4seed2/evaluation/generation/examples.4b284b6bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b1b9c4seed1/evaluation/generation/examples.4b284b1b9c4seed1_GEM-wiki_lingua_en_tldr_en_0.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b1b9c4seed2/evaluation/generation/examples.4b284b1b9c4seed2_gem_xsum_article_DOC_summary_3.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b1b9c4seed4/evaluation/generation/examples.4b284b1b9c4seed4_GEM-web_nlg_en_PALM_prompt_5.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b1b9c4seed4/evaluation/generation/examples.4b284b1b9c4seed4_GEM-wiki_lingua_en_tldr_en_4.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b6bc4seed3/evaluation/generation/examples.4b284b6bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b1b9c4seed3/evaluation/generation/examples.4b284b1b9c4seed3_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b1b9c4seed4/evaluation/generation/examples.4b284b1b9c4seed4_GEM-web_nlg_en_PALM_prompt_4.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b6bc4seed1/evaluation/generation/examples.4b284b6bc4seed1_GEM-web_nlg_en_PALM_prompt_3.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b6bc4seed1/evaluation/generation/examples.4b284b6bc4seed1_gem_xsum_article_DOC_summary_5.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b6bc4seed1/evaluation/generation/examples.4b284b6bc4seed1_gem_xsum_article_DOC_summary_4.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b6bc4seed2/evaluation/generation/examples.4b284b6bc4seed2_gem_xsum_article_DOC_summary_1.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b6bc4seed3/evaluation/generation/examples.4b284b6bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b1b9c4seed1/evaluation/generation/examples.4b284b1b9c4seed1_GEM-web_nlg_en_PALM_prompt_2.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b1b9c4seed1/evaluation/generation/examples.4b284b1b9c4seed1_GEM-wiki_lingua_en_tldr_en_3.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b1b9c4seed2/evaluation/generation/examples.4b284b1b9c4seed2_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b1b9c4seed3/evaluation/generation/examples.4b284b1b9c4seed3_GEM-web_nlg_en_PALM_prompt_4.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b1b9c4seed4/evaluation/generation/examples.4b284b1b9c4seed4_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b1b9c4seed4/evaluation/generation/examples.4b284b1b9c4seed4_gem_xsum_article_DOC_summary_0.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b6bc4seed1/evaluation/generation/examples.4b284b6bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b6bc4seed3/evaluation/generation/examples.4b284b6bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b1b9c4seed1/evaluation/generation/examples.4b284b1b9c4seed1_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b1b9c4seed1/evaluation/generation/examples.4b284b1b9c4seed1_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b1b9c4seed3/evaluation/generation/examples.4b284b1b9c4seed3_GEM-web_nlg_en_PALM_prompt_5.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b1b9c4seed3/evaluation/generation/examples.4b284b1b9c4seed3_GEM-wiki_lingua_en_tldr_en_4.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b1b9c4seed3/evaluation/generation/examples.4b284b1b9c4seed3_GEM-web_nlg_en_PALM_prompt_1.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b6bc4seed3/evaluation/generation/examples.4b284b6bc4seed3_GEM-web_nlg_en_PALM_prompt_3.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b6bc4seed3/evaluation/generation/examples.4b284b6bc4seed3_gem_xsum_article_DOC_summary_5.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b6bc4seed4/evaluation/generation/examples.4b284b6bc4seed4_gem_xsum_article_DOC_summary_1.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b1b9c4seed1/evaluation/generation/examples.4b284b1b9c4seed1_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b1b9c4seed1/evaluation/generation/examples.4b284b1b9c4seed1_GEM-wiki_lingua_en_tldr_en_1.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b1b9c4seed1/evaluation/generation/examples.4b284b1b9c4seed1_gem_xsum_article_DOC_summary_3.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b1b9c4seed2/evaluation/generation/examples.4b284b1b9c4seed2_GEM-wiki_lingua_en_tldr_en_2.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b6bc4seed1/evaluation/generation/examples.4b284b6bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b6bc4seed3/evaluation/generation/examples.4b284b6bc4seed3_GEM-wiki_lingua_en_tldr_en_2.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b6bc4seed2/evaluation/generation/examples.4b284b6bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b6bc4seed2/evaluation/generation/examples.4b284b6bc4seed2_GEM-web_nlg_en_PALM_prompt_3.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b6bc4seed4/evaluation/generation/examples.4b284b6bc4seed4_GEM-web_nlg_en_PALM_prompt_4.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b6bc4seed2/evaluation/generation/examples.4b284b6bc4seed2_GEM-wiki_lingua_en_tldr_en_2.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b6bc4seed3/evaluation/generation/examples.4b284b6bc4seed3_gem_xsum_article_DOC_summary_4.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b1b9c4seed3/evaluation/generation/examples.4b284b1b9c4seed3_gem_xsum_article_DOC_summary_1.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b1b9c4seed3/evaluation/generation/examples.4b284b1b9c4seed3_gem_xsum_article_DOC_summary_2.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b1b9c4seed3/evaluation/generation/examples.4b284b1b9c4seed3_gem_xsum_article_DOC_summary_5.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b1b9c4seed4/evaluation/generation/examples.4b284b1b9c4seed4_GEM-web_nlg_en_PALM_prompt_1.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b6bc4seed1/evaluation/generation/examples.4b284b6bc4seed1_gem_xsum_article_DOC_summary_2.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b6bc4seed1/evaluation/generation/examples.4b284b6bc4seed1_gem_xsum_article_DOC_summary_3.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b6bc4seed2/evaluation/generation/examples.4b284b6bc4seed2_GEM-wiki_lingua_en_tldr_en_1.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b6bc4seed2/evaluation/generation/examples.4b284b6bc4seed2_gem_xsum_article_DOC_summary_0.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b1b9c4seed4/evaluation/generation/examples.4b284b1b9c4seed4_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b1b9c4seed4/evaluation/generation/examples.4b284b1b9c4seed4_gem_xsum_article_DOC_summary_4.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b6bc4seed1/evaluation/generation/examples.4b284b6bc4seed1_GEM-web_nlg_en_PALM_prompt_2.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b6bc4seed1/evaluation/generation/examples.4b284b6bc4seed1_GEM-wiki_lingua_en_tldr_en_4.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b6bc4seed3/evaluation/generation/examples.4b284b6bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b6bc4seed3/evaluation/generation/examples.4b284b6bc4seed3_GEM-web_nlg_en_PALM_prompt_0.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b6bc4seed3/evaluation/generation/examples.4b284b6bc4seed3_GEM-web_nlg_en_PALM_prompt_5.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b1b9c4seed1/evaluation/generation/examples.4b284b1b9c4seed1_GEM-wiki_lingua_en_tldr_en_5.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b1b9c4seed2/evaluation/generation/examples.4b284b1b9c4seed2_gem_xsum_article_DOC_summary_1.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b1b9c4seed2/evaluation/generation/examples.4b284b1b9c4seed2_gem_xsum_article_DOC_summary_2.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b1b9c4seed2/evaluation/generation/examples.4b284b1b9c4seed2_gem_xsum_article_DOC_summary_5.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b6bc4seed4/evaluation/generation/examples.4b284b6bc4seed4_GEM-web_nlg_en_PALM_prompt_1.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b6bc4seed4/evaluation/generation/examples.4b284b6bc4seed4_GEM-wiki_lingua_en_tldr_en_5.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b1b9c4seed2/evaluation/generation/examples.4b284b1b9c4seed2_GEM-web_nlg_en_PALM_prompt_5.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b1b9c4seed2/evaluation/generation/examples.4b284b1b9c4seed2_GEM-wiki_lingua_en_tldr_en_4.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b1b9c4seed3/evaluation/generation/examples.4b284b1b9c4seed3_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b6bc4seed3/evaluation/generation/examples.4b284b6bc4seed3_GEM-wiki_lingua_en_tldr_en_1.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b6bc4seed2/evaluation/generation/examples.4b284b6bc4seed2_GEM-web_nlg_en_PALM_prompt_5.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b6bc4seed4/evaluation/generation/examples.4b284b6bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b1b9c4seed2/evaluation/generation/examples.4b284b1b9c4seed2_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b1b9c4seed2/evaluation/generation/examples.4b284b1b9c4seed2_GEM-web_nlg_en_PALM_prompt_4.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b6bc4seed1/evaluation/generation/examples.4b284b6bc4seed1_GEM-wiki_lingua_en_tldr_en_0.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b6bc4seed2/evaluation/generation/examples.4b284b6bc4seed2_GEM-web_nlg_en_PALM_prompt_0.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b6bc4seed1/evaluation/generation/examples.4b284b6bc4seed1_GEM-web_nlg_en_PALM_prompt_5.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b6bc4seed2/evaluation/generation/examples.4b284b6bc4seed2_GEM-wiki_lingua_en_tldr_en_0.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b1b9c4seed1/evaluation/generation/examples.4b284b1b9c4seed1_GEM-web_nlg_en_PALM_prompt_3.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b1b9c4seed2/evaluation/generation/examples.4b284b1b9c4seed2_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b1b9c4seed2/evaluation/generation/examples.4b284b1b9c4seed2_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b6bc4seed1/evaluation/generation/examples.4b284b6bc4seed1_GEM-web_nlg_en_PALM_prompt_0.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b1b9c4seed1/evaluation/generation/examples.4b284b1b9c4seed1_gem_xsum_article_DOC_summary_5.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b1b9c4seed2/evaluation/generation/examples.4b284b1b9c4seed2_GEM-web_nlg_en_PALM_prompt_1.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b1b9c4seed3/evaluation/generation/examples.4b284b1b9c4seed3_GEM-wiki_lingua_en_tldr_en_2.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b6bc4seed3/evaluation/generation/examples.4b284b6bc4seed3_GEM-web_nlg_en_PALM_prompt_2.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b1b9c4seed1/evaluation/generation/examples.4b284b1b9c4seed1_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b1b9c4seed1/evaluation/generation/examples.4b284b1b9c4seed1_GEM-web_nlg_en_PALM_prompt_0.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b1b9c4seed1/evaluation/generation/examples.4b284b1b9c4seed1_gem_xsum_article_DOC_summary_1.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b1b9c4seed1/evaluation/generation/examples.4b284b1b9c4seed1_gem_xsum_article_DOC_summary_2.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b6bc4seed4/evaluation/generation/examples.4b284b6bc4seed4_GEM-wiki_lingua_en_tldr_en_3.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b6bc4seed3/evaluation/generation/examples.4b284b6bc4seed3_GEM-wiki_lingua_en_tldr_en_4.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b6bc4seed3/evaluation/generation/examples.4b284b6bc4seed3_gem_xsum_article_DOC_summary_2.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b6bc4seed3/evaluation/generation/examples.4b284b6bc4seed3_gem_xsum_article_DOC_summary_3.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b6bc4seed4/evaluation/generation/examples.4b284b6bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b1b9c4seed3/evaluation/generation/examples.4b284b1b9c4seed3_gem_xsum_article_DOC_summary_3.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b1b9c4seed4/evaluation/generation/examples.4b284b1b9c4seed4_GEM-wiki_lingua_en_tldr_en_2.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b6bc4seed3/evaluation/generation/examples.4b284b6bc4seed3_GEM-wiki_lingua_en_tldr_en_0.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b6bc4seed4/evaluation/generation/examples.4b284b6bc4seed4_gem_xsum_article_DOC_summary_0.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b6bc4seed1/evaluation/generation/examples.4b284b6bc4seed1_GEM-wiki_lingua_en_tldr_en_1.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b6bc4seed2/evaluation/generation/examples.4b284b6bc4seed2_GEM-web_nlg_en_PALM_prompt_2.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b6bc4seed2/evaluation/generation/examples.4b284b6bc4seed2_GEM-wiki_lingua_en_tldr_en_4.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b6bc4seed3/evaluation/generation/examples.4b284b6bc4seed3_GEM-web_nlg_en_PALM_prompt_1.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b6bc4seed3/evaluation/generation/examples.4b284b6bc4seed3_GEM-wiki_lingua_en_tldr_en_5.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b6bc4seed4/evaluation/generation/examples.4b284b6bc4seed4_GEM-wiki_lingua_en_tldr_en_1.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b1b9c4seed1/evaluation/generation/examples.4b284b1b9c4seed1_GEM-wiki_lingua_en_tldr_en_2.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b1b9c4seed2/evaluation/generation/examples.4b284b1b9c4seed2_GEM-wiki_lingua_en_tldr_en_1.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b1b9c4seed3/evaluation/generation/examples.4b284b1b9c4seed3_GEM-web_nlg_en_PALM_prompt_0.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b1b9c4seed3/evaluation/generation/examples.4b284b1b9c4seed3_gem_xsum_article_DOC_summary_4.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b6bc4seed2/evaluation/generation/examples.4b284b6bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b6bc4seed2/evaluation/generation/examples.4b284b6bc4seed2_gem_xsum_article_DOC_summary_2.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b6bc4seed2/evaluation/generation/examples.4b284b6bc4seed2_gem_xsum_article_DOC_summary_3.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b1b9c4seed1/evaluation/generation/examples.4b284b1b9c4seed1_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b1b9c4seed1/evaluation/generation/examples.4b284b1b9c4seed1_gem_xsum_article_DOC_summary_0.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b1b9c4seed3/evaluation/generation/examples.4b284b1b9c4seed3_GEM-web_nlg_en_PALM_prompt_3.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b6bc4seed1/evaluation/generation/examples.4b284b6bc4seed1_gem_xsum_article_DOC_summary_0.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b1b9c4seed4/evaluation/generation/examples.4b284b1b9c4seed4_GEM-web_nlg_en_PALM_prompt_3.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b6bc4seed1/evaluation/generation/examples.4b284b6bc4seed1_GEM-wiki_lingua_en_tldr_en_3.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b6bc4seed2/evaluation/generation/examples.4b284b6bc4seed2_GEM-web_nlg_en_PALM_prompt_1.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b6bc4seed2/evaluation/generation/examples.4b284b6bc4seed2_GEM-wiki_lingua_en_tldr_en_5.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b6bc4seed4/evaluation/generation/examples.4b284b6bc4seed4_GEM-web_nlg_en_PALM_prompt_5.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b1b9c4seed3/evaluation/generation/examples.4b284b1b9c4seed3_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b1b9c4seed3/evaluation/generation/examples.4b284b1b9c4seed3_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b1b9c4seed4/evaluation/generation/examples.4b284b1b9c4seed4_GEM-web_nlg_en_PALM_prompt_0.jsonl filter=lfs diff=lfs merge=lfs -text +4b284b6bc4seed4/evaluation/generation/examples.4b284b6bc4seed4_GEM-web_nlg_en_PALM_prompt_0.jsonl filter=lfs diff=lfs merge=lfs -text diff --git a/4b284b1b9c4seed1/evaluation/generation/agg.4b284b1b9c4seed1_GEM-web_nlg_en_PALM_prompt_0.json b/4b284b1b9c4seed1/evaluation/generation/agg.4b284b1b9c4seed1_GEM-web_nlg_en_PALM_prompt_0.json new file mode 100644 index 0000000000000000000000000000000000000000..7a0a0f8099d97f17df09bfa137b49d1d4ba982f8 --- /dev/null +++ b/4b284b1b9c4seed1/evaluation/generation/agg.4b284b1b9c4seed1_GEM-web_nlg_en_PALM_prompt_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.3066098749246226, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.026080136938068845}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.07111826415088063, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.002839089906272575}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.2506712149564081, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004757508557066865}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.08751164861028739, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.00199981726737483}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.03319077620530337, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0020231897791775106}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.11077608891772334, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.003107351453235033}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.03876750875187201, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.001265364536751268}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.06647718723035836, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0026791734683438173}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.23570838504150982, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.00455197819987753}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.08166593395748795, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0018388377390052121}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.06672890451920119, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.002733920332843438}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.23129644774314756, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0043201593384418835}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.08123251691641209, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0018438238359305395}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b1b9c4seed1/evaluation/generation/agg.4b284b1b9c4seed1_GEM-web_nlg_en_PALM_prompt_1.json b/4b284b1b9c4seed1/evaluation/generation/agg.4b284b1b9c4seed1_GEM-web_nlg_en_PALM_prompt_1.json new file mode 100644 index 0000000000000000000000000000000000000000..f4f30281d090dc3416080e7733aee4e66525d17d --- /dev/null +++ b/4b284b1b9c4seed1/evaluation/generation/agg.4b284b1b9c4seed1_GEM-web_nlg_en_PALM_prompt_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.3038192608605564, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.015699254374158}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.05683590873929071, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0020467792157088907}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.27017378109951967, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004955059066352234}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.08003564917768238, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0016231021328505706}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.02302654571104229, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0013956717371657963}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.11037888710881248, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0030905387552418112}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.03157133816619759, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0009524060107538227}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.05138484982672407, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0019566614919068054}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.24316258353203007, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004414830331308628}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.07172579578796798, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0014182749325865474}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.05290704322980144, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0019882546868578662}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.24942020154922606, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0044964221550096405}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.07395133279168084, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0014906191471968171}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b1b9c4seed1/evaluation/generation/agg.4b284b1b9c4seed1_GEM-web_nlg_en_PALM_prompt_2.json b/4b284b1b9c4seed1/evaluation/generation/agg.4b284b1b9c4seed1_GEM-web_nlg_en_PALM_prompt_2.json new file mode 100644 index 0000000000000000000000000000000000000000..3a8bc9f224c986f9e5103198fc4cb46d24230ab3 --- /dev/null +++ b/4b284b1b9c4seed1/evaluation/generation/agg.4b284b1b9c4seed1_GEM-web_nlg_en_PALM_prompt_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.2987651957407001, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.01165146487326007}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.05700016441399435, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0017866333928080581}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.2804134367029925, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004805713426369978}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.0831895052852721, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.001625324041245366}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.02233985054458201, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0010710584040813141}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.11320206879663894, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.002939251451992755}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.032089824292963406, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0009447259591619087}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.04971200204444394, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0015276050991763481}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.24706303672621477, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004167944129872773}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.07258794061798622, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0013375852482102129}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.05309006495197277, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0016898819992046204}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.2605549805843784, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004415202735971505}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.0771940777807749, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0014906191322966035}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b1b9c4seed1/evaluation/generation/agg.4b284b1b9c4seed1_GEM-web_nlg_en_PALM_prompt_3.json b/4b284b1b9c4seed1/evaluation/generation/agg.4b284b1b9c4seed1_GEM-web_nlg_en_PALM_prompt_3.json new file mode 100644 index 0000000000000000000000000000000000000000..c5ee6deb13caa0d52a3dd775f687272ca2513f33 --- /dev/null +++ b/4b284b1b9c4seed1/evaluation/generation/agg.4b284b1b9c4seed1_GEM-web_nlg_en_PALM_prompt_3.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.3178292125394837, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.016436461817007326}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.05949762170434375, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.002164217791856107}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.2804633597246112, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004772273934843173}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.08130575650688132, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.001537824456242504}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.02315468230294224, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0013116150015292844}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.11210805274384686, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0030446087077799903}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.03098393961344455, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0009090838201088959}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.05296448349205633, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.002039688636224555}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.24654397231374384, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004152222617956148}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.07145815124416759, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0013532821520358354}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.05596829767493985, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0021073938497608454}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.2610555009310582, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004427499077140127}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.07576475402518883, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0014334163239098205}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 3, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b1b9c4seed1/evaluation/generation/agg.4b284b1b9c4seed1_GEM-web_nlg_en_PALM_prompt_4.json b/4b284b1b9c4seed1/evaluation/generation/agg.4b284b1b9c4seed1_GEM-web_nlg_en_PALM_prompt_4.json new file mode 100644 index 0000000000000000000000000000000000000000..6cdc18cdbad605bc1861b97318bc77e09ac34925 --- /dev/null +++ b/4b284b1b9c4seed1/evaluation/generation/agg.4b284b1b9c4seed1_GEM-web_nlg_en_PALM_prompt_4.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.33395098766218884, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.018968072553356623}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.05735023477794692, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0018410250349017107}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.29141762974212615, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004822950393157349}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.08367597785312914, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0016033089150747774}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.021651705429468177, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0010514293026879199}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.11750125883404142, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.003178578433572342}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.031540027671483784, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0009467316903388299}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.050054640877740926, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0016864461898684513}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.25450526989064276, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004210704440467058}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.07260423911237245, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.001376149178581389}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.05345237810332766, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0017804800879000749}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.2697483182511519, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004417715268392961}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.07753657862492522, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.001496405647152453}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 4, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b1b9c4seed1/evaluation/generation/agg.4b284b1b9c4seed1_GEM-web_nlg_en_PALM_prompt_5.json b/4b284b1b9c4seed1/evaluation/generation/agg.4b284b1b9c4seed1_GEM-web_nlg_en_PALM_prompt_5.json new file mode 100644 index 0000000000000000000000000000000000000000..b9e08e79ec85bc1ea268cb7e51bbc4233a92ed1b --- /dev/null +++ b/4b284b1b9c4seed1/evaluation/generation/agg.4b284b1b9c4seed1_GEM-web_nlg_en_PALM_prompt_5.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.3641656854611542, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.015309152040195284}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.052896109217414104, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0014365647910545604}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.28995885739987826, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.00491862249100831}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.0809120070880779, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0014755261393375114}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.01993001210350518, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0007373235006634328}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.11732616625283977, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0031965230579063257}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.030494115579364812, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0008357516400780779}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.04580220322739789, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.001313492675076717}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.25087552702336663, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004197343182524436}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.06970781602649807, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0012557281083211698}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.04920701939583041, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0013657560657982203}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.2686976948346208, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.00450965297817273}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.0750837322403333, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.001370229544506872}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 5, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b1b9c4seed1/evaluation/generation/agg.4b284b1b9c4seed1_GEM-wiki_lingua_en_tldr_en_0.json b/4b284b1b9c4seed1/evaluation/generation/agg.4b284b1b9c4seed1_GEM-wiki_lingua_en_tldr_en_0.json new file mode 100644 index 0000000000000000000000000000000000000000..f5ec1d214c4456c086c221c2768842c5e3618a6f --- /dev/null +++ b/4b284b1b9c4seed1/evaluation/generation/agg.4b284b1b9c4seed1_GEM-wiki_lingua_en_tldr_en_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.153949065103856, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0018954240620966882}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.25650646122704474, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0024640946950302985}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.17763908527361025, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0017411319281415913}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.028019269400656518, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0007188326863079863}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.04807149188073896, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0012737937496356626}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.03228562656211838, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0007610456704112464}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.114473205278599, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0013050419999849348}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.1979090080195594, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0019738106671277266}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.1335773049328249, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.001206400625022134}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.1434687817382672, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.001762712661710752}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.24013798061889524, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.002330459097368292}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.16579309345906998, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0016200879357240658}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 1.3310013488043524, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.051303312771233796}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b1b9c4seed1/evaluation/generation/agg.4b284b1b9c4seed1_GEM-wiki_lingua_en_tldr_en_1.json b/4b284b1b9c4seed1/evaluation/generation/agg.4b284b1b9c4seed1_GEM-wiki_lingua_en_tldr_en_1.json new file mode 100644 index 0000000000000000000000000000000000000000..a23d01bc33188c2635dc3114b81f0224c367d8d5 --- /dev/null +++ b/4b284b1b9c4seed1/evaluation/generation/agg.4b284b1b9c4seed1_GEM-wiki_lingua_en_tldr_en_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.15222498270112908, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0018427545457994695}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.2575304318026435, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0025171368376624634}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.17784343637401165, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0017678913033546437}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.027223166689333656, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0007022412791947103}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.047627933423561246, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0012809278259731988}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.03198373436508538, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0007797542212099719}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.10932432127036033, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.001193214863192186}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.19223797000244636, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.001923076446257654}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.1293204461841411, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.001171111199270059}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.1432522940492175, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0017229652479762334}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.2435323142827951, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.002380294263101675}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.16757050221415196, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0016483223875673962}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 1.538506754528524, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.05237098925801456}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b1b9c4seed1/evaluation/generation/agg.4b284b1b9c4seed1_GEM-wiki_lingua_en_tldr_en_2.json b/4b284b1b9c4seed1/evaluation/generation/agg.4b284b1b9c4seed1_GEM-wiki_lingua_en_tldr_en_2.json new file mode 100644 index 0000000000000000000000000000000000000000..94a050dce993aa3d03abf18158e991f5bd18d327 --- /dev/null +++ b/4b284b1b9c4seed1/evaluation/generation/agg.4b284b1b9c4seed1_GEM-wiki_lingua_en_tldr_en_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.1563882321550081, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.001888617387583986}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.26533453283498676, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0025530833044838525}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.1825901932807019, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.001772393389777701}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.03007920986659565, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0007656205465392793}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.05242348060271486, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.001402785333640821}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.03484256216837846, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0008050464414919185}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.11302771471874037, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0012603520129098162}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.19883145591680731, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.001967593430993135}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.133378449269488, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0011786586689251871}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.14736580481316963, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.001773298946199036}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.25099172388853663, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0024263653927730773}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.17216601216038344, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0016569952491396495}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 1.641398523262805, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.05167522892405418}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b1b9c4seed1/evaluation/generation/agg.4b284b1b9c4seed1_GEM-wiki_lingua_en_tldr_en_3.json b/4b284b1b9c4seed1/evaluation/generation/agg.4b284b1b9c4seed1_GEM-wiki_lingua_en_tldr_en_3.json new file mode 100644 index 0000000000000000000000000000000000000000..8164309fac9646a1bc05dc6938f135d94c3586f1 --- /dev/null +++ b/4b284b1b9c4seed1/evaluation/generation/agg.4b284b1b9c4seed1_GEM-wiki_lingua_en_tldr_en_3.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.1389473709497086, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.002165945649654676}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.22609159173620905, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0029302654026930365}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.15630117454287198, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002033104554438234}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.026390272714025626, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0007567994736605611}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.04479360431887114, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0013217939246997325}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.02997981495146458, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.000789727045647715}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.1008235900865201, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0015515937317845793}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.16915259930611842, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002256313909124414}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.11400981222806023, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0014106173327737745}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.13075025696794762, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0020447039924209433}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.21298194277055252, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0027618131658537198}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.14696382199884428, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0019053060135896015}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 1.6905078353779432, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.07249934930658058}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 3, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b1b9c4seed1/evaluation/generation/agg.4b284b1b9c4seed1_GEM-wiki_lingua_en_tldr_en_4.json b/4b284b1b9c4seed1/evaluation/generation/agg.4b284b1b9c4seed1_GEM-wiki_lingua_en_tldr_en_4.json new file mode 100644 index 0000000000000000000000000000000000000000..4187d35df80f7bd37db400196893f6c96ce83690 --- /dev/null +++ b/4b284b1b9c4seed1/evaluation/generation/agg.4b284b1b9c4seed1_GEM-wiki_lingua_en_tldr_en_4.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.0489492492227955, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.001789814805368641}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.08138629581304692, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.002787495081772674}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.053849493676637585, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0018128550224799451}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.00954245354371464, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.000496033168499096}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.017770514262613592, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.001037990108744839}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.010951183251337409, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.000542318137546649}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.036730466496340326, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0013603756574255225}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.06226680749750502, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002169104206622538}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.04018322578320604, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0013246122432655602}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.04606259413041724, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0016946531131761852}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.07642507746995442, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0026253735820234}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.05051235209315841, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0017010930529641197}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 0.39343180321276056, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.0293119272772715}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 4, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b1b9c4seed1/evaluation/generation/agg.4b284b1b9c4seed1_GEM-wiki_lingua_en_tldr_en_5.json b/4b284b1b9c4seed1/evaluation/generation/agg.4b284b1b9c4seed1_GEM-wiki_lingua_en_tldr_en_5.json new file mode 100644 index 0000000000000000000000000000000000000000..ed3478fc303cb1b6a246defb71b8f4a7edf34e00 --- /dev/null +++ b/4b284b1b9c4seed1/evaluation/generation/agg.4b284b1b9c4seed1_GEM-wiki_lingua_en_tldr_en_5.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.00785532086822979, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0008059057817636163}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.012189729776176633, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0011529440251866266}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.008211770721120311, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0007739119234145405}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.001629059190316381, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.00023332897761005325}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.0026264060986572716, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.00038760636790030855}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.0016759752492624186, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.00021435787709352103}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.006024210894010907, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.000610190662185335}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.009693715133781285, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0009327234614976355}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.006313837482340284, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0005834402713093119}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.007292999371042805, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0007486511125870423}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.01142399455584086, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0010918019151945164}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.007631652279250868, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0007207775362203403}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 4.795621548580966e-07, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 9.116423959336365e-07}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 5, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b1b9c4seed1/evaluation/generation/agg.4b284b1b9c4seed1_e2e_nlg_cleaned_generate_text_restaurant_0.json b/4b284b1b9c4seed1/evaluation/generation/agg.4b284b1b9c4seed1_e2e_nlg_cleaned_generate_text_restaurant_0.json new file mode 100644 index 0000000000000000000000000000000000000000..77592b8a1a037bf6af137f2256845641103f29a8 --- /dev/null +++ b/4b284b1b9c4seed1/evaluation/generation/agg.4b284b1b9c4seed1_e2e_nlg_cleaned_generate_text_restaurant_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 1.3467292138388522, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.0636854285236688}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.21376122377294582, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.003423965804716776}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.11826204808312468, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0016068929332226103}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.12012011760848791, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0013303613929234116}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.04464223015901598, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0015055825472803579}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.024459729176383012, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0007148574718681848}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.02367441172991871, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0006343126685728484}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.17720781770238822, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0025232418694504655}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.10503799964127797, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.001452728215385968}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.10396010404779424, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0010907224654039642}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.18148501626393876, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0027979704321773107}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.10087939658175359, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0014051358188386478}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.10215080373243925, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.001109159488438079}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b1b9c4seed1/evaluation/generation/agg.4b284b1b9c4seed1_e2e_nlg_cleaned_generate_text_restaurant_1.json b/4b284b1b9c4seed1/evaluation/generation/agg.4b284b1b9c4seed1_e2e_nlg_cleaned_generate_text_restaurant_1.json new file mode 100644 index 0000000000000000000000000000000000000000..1ca130483428bf759cd3746062650411a02d7d3f --- /dev/null +++ b/4b284b1b9c4seed1/evaluation/generation/agg.4b284b1b9c4seed1_e2e_nlg_cleaned_generate_text_restaurant_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 4.5480283931845324, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.05660434588182871}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.23525526703689217, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.002224131117862929}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.41213522865304736, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0026261778490009914}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.28179765051154215, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0018423691903722364}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.08756330373099659, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.001382664098826369}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.15485417637322493, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.001859705859804789}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.10436721293825027, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0012564399976213632}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.18389946486758244, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0017430632737902262}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.3260598830971049, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0021720923944008705}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.2209222812840664, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0014041408204809602}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.19611766071180928, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.002000511520927801}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.3429462721297835, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.002447036789471601}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.23443730171613159, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0016999346317063447}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b1b9c4seed1/evaluation/generation/agg.4b284b1b9c4seed1_e2e_nlg_cleaned_generate_text_restaurant_2.json b/4b284b1b9c4seed1/evaluation/generation/agg.4b284b1b9c4seed1_e2e_nlg_cleaned_generate_text_restaurant_2.json new file mode 100644 index 0000000000000000000000000000000000000000..3ad80031ae2dca518fc306c6515ce5f701a3b9da --- /dev/null +++ b/4b284b1b9c4seed1/evaluation/generation/agg.4b284b1b9c4seed1_e2e_nlg_cleaned_generate_text_restaurant_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 4.919099078160439, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.07401079447832073}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.22830891168453196, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0020226351669978943}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.430501449249562, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0025067528428449337}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.2848021533685038, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0017517841909149951}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.08874046699895509, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0012536346039166443}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.17058058024587597, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0019277334580117154}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.11056535384060841, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0012335424952574436}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.17874631886223866, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0015432601430013146}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.34228892513027326, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0021544507147917644}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.22429066792419844, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0013639521320318918}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.19159590399736812, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0017744554514183184}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.36333660692954056, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0024452838301491264}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.23961627743436656, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0016466360617377184}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b1b9c4seed1/evaluation/generation/agg.4b284b1b9c4seed1_e2e_nlg_cleaned_generate_text_restaurant_3.json b/4b284b1b9c4seed1/evaluation/generation/agg.4b284b1b9c4seed1_e2e_nlg_cleaned_generate_text_restaurant_3.json new file mode 100644 index 0000000000000000000000000000000000000000..16db5676bfa9085573748796468a01be013febaf --- /dev/null +++ b/4b284b1b9c4seed1/evaluation/generation/agg.4b284b1b9c4seed1_e2e_nlg_cleaned_generate_text_restaurant_3.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 5.161685848623118, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.07262509824163077}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.2250406541329284, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0018984959829563015}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.4401409797987255, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0024818459349912466}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.28625759764760766, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0017505915200592458}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.08992659254313957, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0012057214319225603}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.17962663745940138, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.00190969756064409}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.11431119935407852, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0012264659705919982}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.17814189014708015, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.001501724354676948}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.3526106772291693, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0021197068010549917}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.22718964393483773, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.001341523865438878}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.19224724023096493, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0017539464959385562}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.375736139296112, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0024062560460738677}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.24420233251967818, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0016511867365175956}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 3, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b1b9c4seed1/evaluation/generation/agg.4b284b1b9c4seed1_e2e_nlg_cleaned_generate_text_restaurant_4.json b/4b284b1b9c4seed1/evaluation/generation/agg.4b284b1b9c4seed1_e2e_nlg_cleaned_generate_text_restaurant_4.json new file mode 100644 index 0000000000000000000000000000000000000000..735c1fc292b3a224672e84c5f29eeb68b8cd91c7 --- /dev/null +++ b/4b284b1b9c4seed1/evaluation/generation/agg.4b284b1b9c4seed1_e2e_nlg_cleaned_generate_text_restaurant_4.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 5.3863626535773195, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.08316568360369772}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.22591638424042498, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.001851012114615343}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.44465520609703646, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0024822890206687306}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.2884803003096355, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0017316301619347632}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.09137947270797166, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0011328131792298333}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.18516155808078238, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0019428991404911535}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.11718583569111816, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.00121705170719205}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.17791538730013262, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.001385852845968636}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.3555171974183999, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0021223337675852177}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.22838715083098254, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0013209819868746765}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.1934093946653807, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0016535132345320634}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.3819852960374735, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0024230711787691338}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.2473033223648628, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.001629820147671333}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 4, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b1b9c4seed1/evaluation/generation/agg.4b284b1b9c4seed1_e2e_nlg_cleaned_generate_text_restaurant_5.json b/4b284b1b9c4seed1/evaluation/generation/agg.4b284b1b9c4seed1_e2e_nlg_cleaned_generate_text_restaurant_5.json new file mode 100644 index 0000000000000000000000000000000000000000..35e2613d7541f8ac921b1a4e93219f73bb47d71e --- /dev/null +++ b/4b284b1b9c4seed1/evaluation/generation/agg.4b284b1b9c4seed1_e2e_nlg_cleaned_generate_text_restaurant_5.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 5.218311341485651, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.08555182976780383}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.22420804212245024, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0018931092685607832}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.43645148946569756, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0023925455584187143}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.2851279405049657, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0017156941599383252}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.08976861428854209, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0012265411317482072}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.17860416167471355, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.001894485841362118}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.11398867145332987, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0012184034191725704}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.17705341704222277, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.001496237569767933}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.3489555989991215, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0020756478234175003}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.22589371892600646, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.001329494456764217}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.19291128629856713, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.001743268774937326}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.3757535087761027, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0023376729302477164}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.24529704048909337, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0016364362199438327}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 5, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b1b9c4seed1/evaluation/generation/agg.4b284b1b9c4seed1_gem_xsum_article_DOC_summary_0.json b/4b284b1b9c4seed1/evaluation/generation/agg.4b284b1b9c4seed1_gem_xsum_article_DOC_summary_0.json new file mode 100644 index 0000000000000000000000000000000000000000..79d8f40fa66933fa1da6758c362cdefa22d3b60b --- /dev/null +++ b/4b284b1b9c4seed1/evaluation/generation/agg.4b284b1b9c4seed1_gem_xsum_article_DOC_summary_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.1404335293516036, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0018475752933584198}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.33304948876480905, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0038506848151682277}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.19317514090993446, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0022112014874136276}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.026070215267481753, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0009166794828332532}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.06470743754786817, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0022637761051235894}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.03629759048462241, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0012314297081491255}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.1032551941800083, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0013020422069113654}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.24743139771736608, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0029799847541024864}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.14245726390092303, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.001599761390324437}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.11056793408323284, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0014447008795606224}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.2644863518283602, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.003301240029680331}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.1525513019630977, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0018062738518410612}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 1.2992802626075217, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.08613536173053919}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b1b9c4seed1/evaluation/generation/agg.4b284b1b9c4seed1_gem_xsum_article_DOC_summary_1.json b/4b284b1b9c4seed1/evaluation/generation/agg.4b284b1b9c4seed1_gem_xsum_article_DOC_summary_1.json new file mode 100644 index 0000000000000000000000000000000000000000..60647b4aaea58123fc0502bba3eaffdba4139a30 --- /dev/null +++ b/4b284b1b9c4seed1/evaluation/generation/agg.4b284b1b9c4seed1_gem_xsum_article_DOC_summary_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.11583572927874138, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0015868267173138404}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.28673470669230483, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.003637777293225723}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.163100228567693, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002132266466808726}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.01724716231152785, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0007449366916925016}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.04477737050796163, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.00198811760305303}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.02461427079155061, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.001063162698284129}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.08830410964622547, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0011164040071930121}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.22077364895161825, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0027438079045214113}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.12465414516933276, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.001518543329628805}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.09327309336629477, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.001264500539576057}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.23298075051437098, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.003053175396768166}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.13165914823095848, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.001722148826191323}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 0.9392811645900702, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.07096662177652757}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b1b9c4seed1/evaluation/generation/agg.4b284b1b9c4seed1_gem_xsum_article_DOC_summary_2.json b/4b284b1b9c4seed1/evaluation/generation/agg.4b284b1b9c4seed1_gem_xsum_article_DOC_summary_2.json new file mode 100644 index 0000000000000000000000000000000000000000..048ec82d56fc0b016468b3488aea6bf57f4e9e61 --- /dev/null +++ b/4b284b1b9c4seed1/evaluation/generation/agg.4b284b1b9c4seed1_gem_xsum_article_DOC_summary_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.11587525551966481, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0016045754710452714}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.2874887710310145, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.003567488833961318}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.16310151647769613, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0021173776446693038}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.01786609643978251, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0007624665922748118}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.046073666078135844, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.00202411128686605}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.02540910163910677, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0010850659455729865}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.08869240853211423, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0011665769716760525}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.2219053477816373, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002750331221052164}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.12516134814219937, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0015660208564047945}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.09346436388002839, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0012938167406065764}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.23423731441915813, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.003085268456864704}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.13195206984139488, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0017467533202419128}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 0.8642738469290718, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.0828969271702355}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b1b9c4seed1/evaluation/generation/agg.4b284b1b9c4seed1_gem_xsum_article_DOC_summary_3.json b/4b284b1b9c4seed1/evaluation/generation/agg.4b284b1b9c4seed1_gem_xsum_article_DOC_summary_3.json new file mode 100644 index 0000000000000000000000000000000000000000..9512174ee48f944e0806830a92ac9ff22336c910 --- /dev/null +++ b/4b284b1b9c4seed1/evaluation/generation/agg.4b284b1b9c4seed1_gem_xsum_article_DOC_summary_3.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.11296838065461887, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0017763597852222038}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.2719068297050645, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0038490332935536237}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.15604881038304613, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0022637041314365453}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.01707269817022361, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0007693549928763936}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.042123589858273434, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0018755138592056807}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.023753467717060665, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0010443537949278742}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.08602111381227089, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.001348786781692891}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.20806883128782105, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0029718527370379577}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.11872182977619025, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0016793576149961092}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.09123263400217625, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0014417280224893359}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.22083691751530135, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0031880991373431033}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.12609518726408814, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0018237508130951488}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 0.8836853896564532, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.04539990589714401}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 3, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b1b9c4seed1/evaluation/generation/agg.4b284b1b9c4seed1_gem_xsum_article_DOC_summary_4.json b/4b284b1b9c4seed1/evaluation/generation/agg.4b284b1b9c4seed1_gem_xsum_article_DOC_summary_4.json new file mode 100644 index 0000000000000000000000000000000000000000..81b3badb361d48663a2b802314e44bade206c259 --- /dev/null +++ b/4b284b1b9c4seed1/evaluation/generation/agg.4b284b1b9c4seed1_gem_xsum_article_DOC_summary_4.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.034882897379201874, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.002246767493274493}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.06473914976317797, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0037002010817473985}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.04091181078946866, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0022902327278297046}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.0038285864418821543, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.00040689869864601153}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.009305544911384899, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0009789224679047535}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.0052797964519696655, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0005471044968877006}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.027308146633009903, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0019083153741966364}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.04967049431208105, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0028488023843374856}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.03128707048743581, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0017437540939162011}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.028950850747643437, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0019932883821356198}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.05263176539885643, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.003033293906854166}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.03330241832085698, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0018775032498108398}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 0.32264946943694406, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.06831405512505326}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 4, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b1b9c4seed1/evaluation/generation/agg.4b284b1b9c4seed1_gem_xsum_article_DOC_summary_5.json b/4b284b1b9c4seed1/evaluation/generation/agg.4b284b1b9c4seed1_gem_xsum_article_DOC_summary_5.json new file mode 100644 index 0000000000000000000000000000000000000000..1e44158e683e89329026b9f0f11966f9f886b0c7 --- /dev/null +++ b/4b284b1b9c4seed1/evaluation/generation/agg.4b284b1b9c4seed1_gem_xsum_article_DOC_summary_5.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.002234714565312147, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0006324566810963234}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.0019083246709728258, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0005363735849273349}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.002011613476498758, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0005611516641301552}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.000275577641004944, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.00018655929326294164}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.00024871355060034306, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.00018003279128987707}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.00025972087637987314, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.00018245934977293284}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.0017513556534527388, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0005186881670205111}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.0015379808798967414, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.00045866786099632605}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.0015954209721237727, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.00046728726635727905}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.001897742561259706, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0005481199006190125}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.0016448900434096786, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0004764592460236093}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.0017182753671868714, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0004901161371032653}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 1.7543632002989705e-39, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 1.694640730371467e-33}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 5, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b1b9c4seed1/evaluation/generation/examples.4b284b1b9c4seed1_GEM-web_nlg_en_PALM_prompt_0.jsonl b/4b284b1b9c4seed1/evaluation/generation/examples.4b284b1b9c4seed1_GEM-web_nlg_en_PALM_prompt_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..8a4ff01c1afa8805301e508e8d2192d9ff6ad524 --- /dev/null +++ b/4b284b1b9c4seed1/evaluation/generation/examples.4b284b1b9c4seed1_GEM-web_nlg_en_PALM_prompt_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:49040058d6debefcb559ec926000a7b06a49758f7a2a0cdc791692d2f1fb07e3 +size 4039112 diff --git a/4b284b1b9c4seed1/evaluation/generation/examples.4b284b1b9c4seed1_GEM-web_nlg_en_PALM_prompt_1.jsonl b/4b284b1b9c4seed1/evaluation/generation/examples.4b284b1b9c4seed1_GEM-web_nlg_en_PALM_prompt_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..1752b06473317c6bce241c7035b66cf875851c30 --- /dev/null +++ b/4b284b1b9c4seed1/evaluation/generation/examples.4b284b1b9c4seed1_GEM-web_nlg_en_PALM_prompt_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cdfb213249bbd852ec13d258d91cda4b080ee251f0eab98d03e15c5a60c4da0b +size 5113528 diff --git a/4b284b1b9c4seed1/evaluation/generation/examples.4b284b1b9c4seed1_GEM-web_nlg_en_PALM_prompt_2.jsonl b/4b284b1b9c4seed1/evaluation/generation/examples.4b284b1b9c4seed1_GEM-web_nlg_en_PALM_prompt_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..8dbcd6686fe3e8a203dde312a222375d7e21eea7 --- /dev/null +++ b/4b284b1b9c4seed1/evaluation/generation/examples.4b284b1b9c4seed1_GEM-web_nlg_en_PALM_prompt_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:02d899592edd11e02fd8a38fa6ac622d734c255193b484adaabacb25a6e57de3 +size 6029118 diff --git a/4b284b1b9c4seed1/evaluation/generation/examples.4b284b1b9c4seed1_GEM-web_nlg_en_PALM_prompt_3.jsonl b/4b284b1b9c4seed1/evaluation/generation/examples.4b284b1b9c4seed1_GEM-web_nlg_en_PALM_prompt_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..3b462d46f9f466970237d3f49793e4ccd12f0a87 --- /dev/null +++ b/4b284b1b9c4seed1/evaluation/generation/examples.4b284b1b9c4seed1_GEM-web_nlg_en_PALM_prompt_3.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a9a3f8682648ca1756fa7692d7312d7156e1e1481b6194f91823e5e49350852c +size 6952945 diff --git a/4b284b1b9c4seed1/evaluation/generation/examples.4b284b1b9c4seed1_GEM-web_nlg_en_PALM_prompt_4.jsonl b/4b284b1b9c4seed1/evaluation/generation/examples.4b284b1b9c4seed1_GEM-web_nlg_en_PALM_prompt_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..295cc03e90c6ad647d2603c3f31b7e84167f5455 --- /dev/null +++ b/4b284b1b9c4seed1/evaluation/generation/examples.4b284b1b9c4seed1_GEM-web_nlg_en_PALM_prompt_4.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fc7736aa07934bb7c99d3266ea7defe571220ff1235dee52f8881db83f961470 +size 7862477 diff --git a/4b284b1b9c4seed1/evaluation/generation/examples.4b284b1b9c4seed1_GEM-web_nlg_en_PALM_prompt_5.jsonl b/4b284b1b9c4seed1/evaluation/generation/examples.4b284b1b9c4seed1_GEM-web_nlg_en_PALM_prompt_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..5452f49a378b4e4340c9804ca20368e1fe10a7cf --- /dev/null +++ b/4b284b1b9c4seed1/evaluation/generation/examples.4b284b1b9c4seed1_GEM-web_nlg_en_PALM_prompt_5.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7cb6142d74f5ad4c96f73193293a929e0acf7ac48a128cf2401b0baa1c122dce +size 8753486 diff --git a/4b284b1b9c4seed1/evaluation/generation/examples.4b284b1b9c4seed1_GEM-wiki_lingua_en_tldr_en_0.jsonl b/4b284b1b9c4seed1/evaluation/generation/examples.4b284b1b9c4seed1_GEM-wiki_lingua_en_tldr_en_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..aca41f77eede3cc7ab61190e5009e604d92ecd65 --- /dev/null +++ b/4b284b1b9c4seed1/evaluation/generation/examples.4b284b1b9c4seed1_GEM-wiki_lingua_en_tldr_en_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b8c89abf4c3744908e7e3153ad403aef3602cc6f8111e594ef61b7a520b11c87 +size 7705828 diff --git a/4b284b1b9c4seed1/evaluation/generation/examples.4b284b1b9c4seed1_GEM-wiki_lingua_en_tldr_en_1.jsonl b/4b284b1b9c4seed1/evaluation/generation/examples.4b284b1b9c4seed1_GEM-wiki_lingua_en_tldr_en_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..7a1ee7f7f79a8d985e9d482fde224b28494b387b --- /dev/null +++ b/4b284b1b9c4seed1/evaluation/generation/examples.4b284b1b9c4seed1_GEM-wiki_lingua_en_tldr_en_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba7fe507c24cd59222124adb63586c0095fc898f3556853127ec27251e2fa094 +size 13328191 diff --git a/4b284b1b9c4seed1/evaluation/generation/examples.4b284b1b9c4seed1_GEM-wiki_lingua_en_tldr_en_2.jsonl b/4b284b1b9c4seed1/evaluation/generation/examples.4b284b1b9c4seed1_GEM-wiki_lingua_en_tldr_en_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..765befc7e220aef336288fd190bfa2417c72c988 --- /dev/null +++ b/4b284b1b9c4seed1/evaluation/generation/examples.4b284b1b9c4seed1_GEM-wiki_lingua_en_tldr_en_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b6e6665174c357f76bf325f0ad6efcc001f79f5ed05496009b405464063734e3 +size 18931505 diff --git a/4b284b1b9c4seed1/evaluation/generation/examples.4b284b1b9c4seed1_GEM-wiki_lingua_en_tldr_en_3.jsonl b/4b284b1b9c4seed1/evaluation/generation/examples.4b284b1b9c4seed1_GEM-wiki_lingua_en_tldr_en_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..12fcc4be4467caf6ba4043054d05a8cca94602a7 --- /dev/null +++ b/4b284b1b9c4seed1/evaluation/generation/examples.4b284b1b9c4seed1_GEM-wiki_lingua_en_tldr_en_3.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e20876626220bac82c9dbbeb74fe9072386b9511ade7fa96ebbca809e35c8881 +size 24350316 diff --git a/4b284b1b9c4seed1/evaluation/generation/examples.4b284b1b9c4seed1_GEM-wiki_lingua_en_tldr_en_4.jsonl b/4b284b1b9c4seed1/evaluation/generation/examples.4b284b1b9c4seed1_GEM-wiki_lingua_en_tldr_en_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..5ed74daaa9255a6cd1b16abc9b29309454179b65 --- /dev/null +++ b/4b284b1b9c4seed1/evaluation/generation/examples.4b284b1b9c4seed1_GEM-wiki_lingua_en_tldr_en_4.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0b31bf332fb11978501273e5ca5dd247afcbfcbb9723284e26e2782d3919fe3c +size 29481257 diff --git a/4b284b1b9c4seed1/evaluation/generation/examples.4b284b1b9c4seed1_GEM-wiki_lingua_en_tldr_en_5.jsonl b/4b284b1b9c4seed1/evaluation/generation/examples.4b284b1b9c4seed1_GEM-wiki_lingua_en_tldr_en_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..8170ea28ddaa5a525abc7954acc1eec355c51f7c --- /dev/null +++ b/4b284b1b9c4seed1/evaluation/generation/examples.4b284b1b9c4seed1_GEM-wiki_lingua_en_tldr_en_5.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:59a34e030acea853d9312fbbedb13c69ec0ea699255d9b060c8e39d434fd5e53 +size 34800856 diff --git a/4b284b1b9c4seed1/evaluation/generation/examples.4b284b1b9c4seed1_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl b/4b284b1b9c4seed1/evaluation/generation/examples.4b284b1b9c4seed1_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..25671b23f508aade3067a947fdd7b8e1733f84f7 --- /dev/null +++ b/4b284b1b9c4seed1/evaluation/generation/examples.4b284b1b9c4seed1_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9b3a0d26ef34e2db3e8cb02e5bf0d855bbc84ed95dc88fd80ae1789b357d0c4e +size 3990292 diff --git a/4b284b1b9c4seed1/evaluation/generation/examples.4b284b1b9c4seed1_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl b/4b284b1b9c4seed1/evaluation/generation/examples.4b284b1b9c4seed1_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..2f41e75228181ccdb698c13433681aef29e0e15b --- /dev/null +++ b/4b284b1b9c4seed1/evaluation/generation/examples.4b284b1b9c4seed1_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e9c5c75f074b044c98069cacd69201e4089e2302f4544974a9e45436259b4cf +size 5462654 diff --git a/4b284b1b9c4seed1/evaluation/generation/examples.4b284b1b9c4seed1_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl b/4b284b1b9c4seed1/evaluation/generation/examples.4b284b1b9c4seed1_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..624d7627e02e484c0856270646396ec8d9b89417 --- /dev/null +++ b/4b284b1b9c4seed1/evaluation/generation/examples.4b284b1b9c4seed1_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7d62b5ace3ffc224ac329adcc1caeaac74b9414dc7f357a3bdd9e00c0bb6b6fe +size 6573997 diff --git a/4b284b1b9c4seed1/evaluation/generation/examples.4b284b1b9c4seed1_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl b/4b284b1b9c4seed1/evaluation/generation/examples.4b284b1b9c4seed1_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..2107acbe2c3dbee4cef2c7009d40b528f70e5ae8 --- /dev/null +++ b/4b284b1b9c4seed1/evaluation/generation/examples.4b284b1b9c4seed1_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:de749d4e4eefcf7c2ce0aff2709ad42739df392dc2976bd1d6a7bb6a75c4451a +size 7670556 diff --git a/4b284b1b9c4seed1/evaluation/generation/examples.4b284b1b9c4seed1_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl b/4b284b1b9c4seed1/evaluation/generation/examples.4b284b1b9c4seed1_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..8f128a5e0898629d3d0529cc8ef3a6c25417fd19 --- /dev/null +++ b/4b284b1b9c4seed1/evaluation/generation/examples.4b284b1b9c4seed1_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6bd7526246102a05dfb00eae954bde266d337214c400844f443c9323331e07a6 +size 8750887 diff --git a/4b284b1b9c4seed1/evaluation/generation/examples.4b284b1b9c4seed1_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl b/4b284b1b9c4seed1/evaluation/generation/examples.4b284b1b9c4seed1_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..25faa87f541c1abea7812ba41e1765ddcab66d24 --- /dev/null +++ b/4b284b1b9c4seed1/evaluation/generation/examples.4b284b1b9c4seed1_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:11e481d38c14c111b07e38ae4084b8e239cbf10308ad4868e28956c709ec8bee +size 9831027 diff --git a/4b284b1b9c4seed1/evaluation/generation/examples.4b284b1b9c4seed1_gem_xsum_article_DOC_summary_0.jsonl b/4b284b1b9c4seed1/evaluation/generation/examples.4b284b1b9c4seed1_gem_xsum_article_DOC_summary_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..f7ec829d17d15f3fbc789abfa7792e2d1c9af7bd --- /dev/null +++ b/4b284b1b9c4seed1/evaluation/generation/examples.4b284b1b9c4seed1_gem_xsum_article_DOC_summary_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:251feb7a4e5545a9f2320eb976e6a5a5126b6955825c303a7e0b2de12c5b6c54 +size 2832154 diff --git a/4b284b1b9c4seed1/evaluation/generation/examples.4b284b1b9c4seed1_gem_xsum_article_DOC_summary_1.jsonl b/4b284b1b9c4seed1/evaluation/generation/examples.4b284b1b9c4seed1_gem_xsum_article_DOC_summary_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..7e07c90232c8511d1bbab3471e0091e968d00e19 --- /dev/null +++ b/4b284b1b9c4seed1/evaluation/generation/examples.4b284b1b9c4seed1_gem_xsum_article_DOC_summary_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:49d110205e8b46f0f7c106d33f3461072bef57d867472bc9a61a03f5f5f7a869 +size 5104545 diff --git a/4b284b1b9c4seed1/evaluation/generation/examples.4b284b1b9c4seed1_gem_xsum_article_DOC_summary_2.jsonl b/4b284b1b9c4seed1/evaluation/generation/examples.4b284b1b9c4seed1_gem_xsum_article_DOC_summary_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..fc5a68bae893c4e9077d9e76bab7ded57c0d10d5 --- /dev/null +++ b/4b284b1b9c4seed1/evaluation/generation/examples.4b284b1b9c4seed1_gem_xsum_article_DOC_summary_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f1c360e55c63be1aa69064c5b4fd716ded7fe68b6142a0da27abd1de34901593 +size 7377687 diff --git a/4b284b1b9c4seed1/evaluation/generation/examples.4b284b1b9c4seed1_gem_xsum_article_DOC_summary_3.jsonl b/4b284b1b9c4seed1/evaluation/generation/examples.4b284b1b9c4seed1_gem_xsum_article_DOC_summary_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..c7039f5ed2d27f2821dace3bebe87497264053ac --- /dev/null +++ b/4b284b1b9c4seed1/evaluation/generation/examples.4b284b1b9c4seed1_gem_xsum_article_DOC_summary_3.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba512f0783919f8452de0d5ca4a328aa6aa5c54bef202f5209814fa78eb540fd +size 9646312 diff --git a/4b284b1b9c4seed1/evaluation/generation/examples.4b284b1b9c4seed1_gem_xsum_article_DOC_summary_4.jsonl b/4b284b1b9c4seed1/evaluation/generation/examples.4b284b1b9c4seed1_gem_xsum_article_DOC_summary_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..32dddd8392dfb0f22bf9b8069f2ba83edcaa06ed --- /dev/null +++ b/4b284b1b9c4seed1/evaluation/generation/examples.4b284b1b9c4seed1_gem_xsum_article_DOC_summary_4.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1d505782a29b65c703b8d25b53ab6c79c1c17846fa4ccbcad6613f91643a7aad +size 11673079 diff --git a/4b284b1b9c4seed1/evaluation/generation/examples.4b284b1b9c4seed1_gem_xsum_article_DOC_summary_5.jsonl b/4b284b1b9c4seed1/evaluation/generation/examples.4b284b1b9c4seed1_gem_xsum_article_DOC_summary_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..5d30ccd88630dc24c867a824e9fe6c4af191c8c5 --- /dev/null +++ b/4b284b1b9c4seed1/evaluation/generation/examples.4b284b1b9c4seed1_gem_xsum_article_DOC_summary_5.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:452e6b3a06898a2e7a5f47203c63f409dc9a3fe5c857ab28a0fccac9a936811e +size 13897438 diff --git a/4b284b1b9c4seed1/evaluation/generation/merged.csv b/4b284b1b9c4seed1/evaluation/generation/merged.csv new file mode 100644 index 0000000000000000000000000000000000000000..114a987f5317830bcf7ce9814025fdd961ed73d3 --- /dev/null +++ b/4b284b1b9c4seed1/evaluation/generation/merged.csv @@ -0,0 +1,53 @@ +dataset,fewshots,prompt,metric,value +e2e_nlg_cleaned,0,generate_text_restaurant,rouge2_fmeasure,0.02367441172991871 +e2e_nlg_cleaned,0,median,rouge2_fmeasure,0.02367441172991871 +e2e_nlg_cleaned,1,generate_text_restaurant,rouge2_fmeasure,0.10436721293825027 +e2e_nlg_cleaned,1,median,rouge2_fmeasure,0.10436721293825027 +e2e_nlg_cleaned,2,generate_text_restaurant,rouge2_fmeasure,0.11056535384060841 +e2e_nlg_cleaned,2,median,rouge2_fmeasure,0.11056535384060841 +e2e_nlg_cleaned,3,generate_text_restaurant,rouge2_fmeasure,0.11431119935407852 +e2e_nlg_cleaned,3,median,rouge2_fmeasure,0.11431119935407852 +e2e_nlg_cleaned,4,generate_text_restaurant,rouge2_fmeasure,0.11718583569111816 +e2e_nlg_cleaned,4,median,rouge2_fmeasure,0.11718583569111816 +e2e_nlg_cleaned,5,generate_text_restaurant,rouge2_fmeasure,0.11398867145332987 +e2e_nlg_cleaned,5,median,rouge2_fmeasure,0.11398867145332987 +e2e_nlg_cleaned,5,average,multiple,0.09734878083455066 +gem_xsum,0,article_DOC_summary,rouge2_fmeasure,0.03629759048462241 +gem_xsum,0,median,rouge2_fmeasure,0.03629759048462241 +gem_xsum,1,article_DOC_summary,rouge2_fmeasure,0.02461427079155061 +gem_xsum,1,median,rouge2_fmeasure,0.02461427079155061 +gem_xsum,2,article_DOC_summary,rouge2_fmeasure,0.02540910163910677 +gem_xsum,2,median,rouge2_fmeasure,0.02540910163910677 +gem_xsum,3,article_DOC_summary,rouge2_fmeasure,0.023753467717060665 +gem_xsum,3,median,rouge2_fmeasure,0.023753467717060665 +gem_xsum,4,article_DOC_summary,rouge2_fmeasure,0.0052797964519696655 +gem_xsum,4,median,rouge2_fmeasure,0.0052797964519696655 +gem_xsum,5,article_DOC_summary,rouge2_fmeasure,0.00025972087637987314 +gem_xsum,5,median,rouge2_fmeasure,0.00025972087637987314 +gem_xsum,5,average,multiple,0.019268991326781667 +web_nlg_en,0,PALM_prompt,rouge2_fmeasure,0.03876750875187201 +web_nlg_en,0,median,rouge2_fmeasure,0.03876750875187201 +web_nlg_en,1,PALM_prompt,rouge2_fmeasure,0.03157133816619759 +web_nlg_en,1,median,rouge2_fmeasure,0.03157133816619759 +web_nlg_en,2,PALM_prompt,rouge2_fmeasure,0.032089824292963406 +web_nlg_en,2,median,rouge2_fmeasure,0.032089824292963406 +web_nlg_en,3,PALM_prompt,rouge2_fmeasure,0.03098393961344455 +web_nlg_en,3,median,rouge2_fmeasure,0.03098393961344455 +web_nlg_en,4,PALM_prompt,rouge2_fmeasure,0.031540027671483784 +web_nlg_en,4,median,rouge2_fmeasure,0.031540027671483784 +web_nlg_en,5,PALM_prompt,rouge2_fmeasure,0.030494115579364812 +web_nlg_en,5,median,rouge2_fmeasure,0.030494115579364812 +web_nlg_en,5,average,multiple,0.03257445901255436 +wiki_lingua_en,0,tldr_en,rouge2_fmeasure,0.03228562656211838 +wiki_lingua_en,0,median,rouge2_fmeasure,0.03228562656211838 +wiki_lingua_en,1,tldr_en,rouge2_fmeasure,0.03198373436508538 +wiki_lingua_en,1,median,rouge2_fmeasure,0.03198373436508538 +wiki_lingua_en,2,tldr_en,rouge2_fmeasure,0.03484256216837846 +wiki_lingua_en,2,median,rouge2_fmeasure,0.03484256216837846 +wiki_lingua_en,3,tldr_en,rouge2_fmeasure,0.02997981495146458 +wiki_lingua_en,3,median,rouge2_fmeasure,0.02997981495146458 +wiki_lingua_en,4,tldr_en,rouge2_fmeasure,0.010951183251337409 +wiki_lingua_en,4,median,rouge2_fmeasure,0.010951183251337409 +wiki_lingua_en,5,tldr_en,rouge2_fmeasure,0.0016759752492624186 +wiki_lingua_en,5,median,rouge2_fmeasure,0.0016759752492624186 +wiki_lingua_en,5,average,multiple,0.023619816091274438 diff --git a/4b284b1b9c4seed1/evaluation/generation/merged.json b/4b284b1b9c4seed1/evaluation/generation/merged.json new file mode 100644 index 0000000000000000000000000000000000000000..aa49262efb1daeeabe0471efb3d556e965e006bd --- /dev/null +++ b/4b284b1b9c4seed1/evaluation/generation/merged.json @@ -0,0 +1 @@ +{"GEM/web_nlg_en": {"0": {"PALM_prompt": {"bleu": 0.3066098749246226, "bleu_stderr": 0.026080136938068845, "rouge1_fmeasure": 0.08751164861028739, "rouge1_fmeasure_stderr": 0.00199981726737483, "rouge1_precision": 0.07111826415088063, "rouge1_precision_stderr": 0.002839089906272575, "rouge1_recall": 0.2506712149564081, "rouge1_recall_stderr": 0.004757508557066865, "rouge2_fmeasure": 0.03876750875187201, "rouge2_fmeasure_stderr": 0.001265364536751268, "rouge2_precision": 0.03319077620530337, "rouge2_precision_stderr": 0.0020231897791775106, "rouge2_recall": 0.11077608891772334, "rouge2_recall_stderr": 0.003107351453235033, "rougeL_fmeasure": 0.08166593395748795, "rougeL_fmeasure_stderr": 0.0018388377390052121, "rougeL_precision": 0.06647718723035836, "rougeL_precision_stderr": 0.0026791734683438173, "rougeL_recall": 0.23570838504150982, "rougeL_recall_stderr": 0.00455197819987753, "rougeLsum_fmeasure": 0.08123251691641209, "rougeLsum_fmeasure_stderr": 0.0018438238359305395, "rougeLsum_precision": 0.06672890451920119, "rougeLsum_precision_stderr": 0.002733920332843438, "rougeLsum_recall": 0.23129644774314756, "rougeLsum_recall_stderr": 0.0043201593384418835}}, "1": {"PALM_prompt": {"bleu": 0.3038192608605564, "bleu_stderr": 0.015699254374158, "rouge1_fmeasure": 0.08003564917768238, "rouge1_fmeasure_stderr": 0.0016231021328505706, "rouge1_precision": 0.05683590873929071, "rouge1_precision_stderr": 0.0020467792157088907, "rouge1_recall": 0.27017378109951967, "rouge1_recall_stderr": 0.004955059066352234, "rouge2_fmeasure": 0.03157133816619759, "rouge2_fmeasure_stderr": 0.0009524060107538227, "rouge2_precision": 0.02302654571104229, "rouge2_precision_stderr": 0.0013956717371657963, "rouge2_recall": 0.11037888710881248, "rouge2_recall_stderr": 0.0030905387552418112, "rougeL_fmeasure": 0.07172579578796798, "rougeL_fmeasure_stderr": 0.0014182749325865474, "rougeL_precision": 0.05138484982672407, "rougeL_precision_stderr": 0.0019566614919068054, "rougeL_recall": 0.24316258353203007, "rougeL_recall_stderr": 0.004414830331308628, "rougeLsum_fmeasure": 0.07395133279168084, "rougeLsum_fmeasure_stderr": 0.0014906191471968171, "rougeLsum_precision": 0.05290704322980144, "rougeLsum_precision_stderr": 0.0019882546868578662, "rougeLsum_recall": 0.24942020154922606, "rougeLsum_recall_stderr": 0.0044964221550096405}}, "2": {"PALM_prompt": {"bleu": 0.2987651957407001, "bleu_stderr": 0.01165146487326007, "rouge1_fmeasure": 0.0831895052852721, "rouge1_fmeasure_stderr": 0.001625324041245366, "rouge1_precision": 0.05700016441399435, "rouge1_precision_stderr": 0.0017866333928080581, "rouge1_recall": 0.2804134367029925, "rouge1_recall_stderr": 0.004805713426369978, "rouge2_fmeasure": 0.032089824292963406, "rouge2_fmeasure_stderr": 0.0009447259591619087, "rouge2_precision": 0.02233985054458201, "rouge2_precision_stderr": 0.0010710584040813141, "rouge2_recall": 0.11320206879663894, "rouge2_recall_stderr": 0.002939251451992755, "rougeL_fmeasure": 0.07258794061798622, "rougeL_fmeasure_stderr": 0.0013375852482102129, "rougeL_precision": 0.04971200204444394, "rougeL_precision_stderr": 0.0015276050991763481, "rougeL_recall": 0.24706303672621477, "rougeL_recall_stderr": 0.004167944129872773, "rougeLsum_fmeasure": 0.0771940777807749, "rougeLsum_fmeasure_stderr": 0.0014906191322966035, "rougeLsum_precision": 0.05309006495197277, "rougeLsum_precision_stderr": 0.0016898819992046204, "rougeLsum_recall": 0.2605549805843784, "rougeLsum_recall_stderr": 0.004415202735971505}}, "3": {"PALM_prompt": {"bleu": 0.3178292125394837, "bleu_stderr": 0.016436461817007326, "rouge1_fmeasure": 0.08130575650688132, "rouge1_fmeasure_stderr": 0.001537824456242504, "rouge1_precision": 0.05949762170434375, "rouge1_precision_stderr": 0.002164217791856107, "rouge1_recall": 0.2804633597246112, "rouge1_recall_stderr": 0.004772273934843173, "rouge2_fmeasure": 0.03098393961344455, "rouge2_fmeasure_stderr": 0.0009090838201088959, "rouge2_precision": 0.02315468230294224, "rouge2_precision_stderr": 0.0013116150015292844, "rouge2_recall": 0.11210805274384686, "rouge2_recall_stderr": 0.0030446087077799903, "rougeL_fmeasure": 0.07145815124416759, "rougeL_fmeasure_stderr": 0.0013532821520358354, "rougeL_precision": 0.05296448349205633, "rougeL_precision_stderr": 0.002039688636224555, "rougeL_recall": 0.24654397231374384, "rougeL_recall_stderr": 0.004152222617956148, "rougeLsum_fmeasure": 0.07576475402518883, "rougeLsum_fmeasure_stderr": 0.0014334163239098205, "rougeLsum_precision": 0.05596829767493985, "rougeLsum_precision_stderr": 0.0021073938497608454, "rougeLsum_recall": 0.2610555009310582, "rougeLsum_recall_stderr": 0.004427499077140127}}, "4": {"PALM_prompt": {"bleu": 0.33395098766218884, "bleu_stderr": 0.018968072553356623, "rouge1_fmeasure": 0.08367597785312914, "rouge1_fmeasure_stderr": 0.0016033089150747774, "rouge1_precision": 0.05735023477794692, "rouge1_precision_stderr": 0.0018410250349017107, "rouge1_recall": 0.29141762974212615, "rouge1_recall_stderr": 0.004822950393157349, "rouge2_fmeasure": 0.031540027671483784, "rouge2_fmeasure_stderr": 0.0009467316903388299, "rouge2_precision": 0.021651705429468177, "rouge2_precision_stderr": 0.0010514293026879199, "rouge2_recall": 0.11750125883404142, "rouge2_recall_stderr": 0.003178578433572342, "rougeL_fmeasure": 0.07260423911237245, "rougeL_fmeasure_stderr": 0.001376149178581389, "rougeL_precision": 0.050054640877740926, "rougeL_precision_stderr": 0.0016864461898684513, "rougeL_recall": 0.25450526989064276, "rougeL_recall_stderr": 0.004210704440467058, "rougeLsum_fmeasure": 0.07753657862492522, "rougeLsum_fmeasure_stderr": 0.001496405647152453, "rougeLsum_precision": 0.05345237810332766, "rougeLsum_precision_stderr": 0.0017804800879000749, "rougeLsum_recall": 0.2697483182511519, "rougeLsum_recall_stderr": 0.004417715268392961}}, "5": {"PALM_prompt": {"bleu": 0.3641656854611542, "bleu_stderr": 0.015309152040195284, "rouge1_fmeasure": 0.0809120070880779, "rouge1_fmeasure_stderr": 0.0014755261393375114, "rouge1_precision": 0.052896109217414104, "rouge1_precision_stderr": 0.0014365647910545604, "rouge1_recall": 0.28995885739987826, "rouge1_recall_stderr": 0.00491862249100831, "rouge2_fmeasure": 0.030494115579364812, "rouge2_fmeasure_stderr": 0.0008357516400780779, "rouge2_precision": 0.01993001210350518, "rouge2_precision_stderr": 0.0007373235006634328, "rouge2_recall": 0.11732616625283977, "rouge2_recall_stderr": 0.0031965230579063257, "rougeL_fmeasure": 0.06970781602649807, "rougeL_fmeasure_stderr": 0.0012557281083211698, "rougeL_precision": 0.04580220322739789, "rougeL_precision_stderr": 0.001313492675076717, "rougeL_recall": 0.25087552702336663, "rougeL_recall_stderr": 0.004197343182524436, "rougeLsum_fmeasure": 0.0750837322403333, "rougeLsum_fmeasure_stderr": 0.001370229544506872, "rougeLsum_precision": 0.04920701939583041, "rougeLsum_precision_stderr": 0.0013657560657982203, "rougeLsum_recall": 0.2686976948346208, "rougeLsum_recall_stderr": 0.00450965297817273}}}, "GEM/wiki_lingua_en": {"0": {"tldr_en": {"bleu": 1.3310013488043524, "bleu_stderr": 0.051303312771233796, "rouge1_fmeasure": 0.17763908527361025, "rouge1_fmeasure_stderr": 0.0017411319281415913, "rouge1_precision": 0.153949065103856, "rouge1_precision_stderr": 0.0018954240620966882, "rouge1_recall": 0.25650646122704474, "rouge1_recall_stderr": 0.0024640946950302985, "rouge2_fmeasure": 0.03228562656211838, "rouge2_fmeasure_stderr": 0.0007610456704112464, "rouge2_precision": 0.028019269400656518, "rouge2_precision_stderr": 0.0007188326863079863, "rouge2_recall": 0.04807149188073896, "rouge2_recall_stderr": 0.0012737937496356626, "rougeL_fmeasure": 0.1335773049328249, "rougeL_fmeasure_stderr": 0.001206400625022134, "rougeL_precision": 0.114473205278599, "rougeL_precision_stderr": 0.0013050419999849348, "rougeL_recall": 0.1979090080195594, "rougeL_recall_stderr": 0.0019738106671277266, "rougeLsum_fmeasure": 0.16579309345906998, "rougeLsum_fmeasure_stderr": 0.0016200879357240658, "rougeLsum_precision": 0.1434687817382672, "rougeLsum_precision_stderr": 0.001762712661710752, "rougeLsum_recall": 0.24013798061889524, "rougeLsum_recall_stderr": 0.002330459097368292}}, "1": {"tldr_en": {"bleu": 1.538506754528524, "bleu_stderr": 0.05237098925801456, "rouge1_fmeasure": 0.17784343637401165, "rouge1_fmeasure_stderr": 0.0017678913033546437, "rouge1_precision": 0.15222498270112908, "rouge1_precision_stderr": 0.0018427545457994695, "rouge1_recall": 0.2575304318026435, "rouge1_recall_stderr": 0.0025171368376624634, "rouge2_fmeasure": 0.03198373436508538, "rouge2_fmeasure_stderr": 0.0007797542212099719, "rouge2_precision": 0.027223166689333656, "rouge2_precision_stderr": 0.0007022412791947103, "rouge2_recall": 0.047627933423561246, "rouge2_recall_stderr": 0.0012809278259731988, "rougeL_fmeasure": 0.1293204461841411, "rougeL_fmeasure_stderr": 0.001171111199270059, "rougeL_precision": 0.10932432127036033, "rougeL_precision_stderr": 0.001193214863192186, "rougeL_recall": 0.19223797000244636, "rougeL_recall_stderr": 0.001923076446257654, "rougeLsum_fmeasure": 0.16757050221415196, "rougeLsum_fmeasure_stderr": 0.0016483223875673962, "rougeLsum_precision": 0.1432522940492175, "rougeLsum_precision_stderr": 0.0017229652479762334, "rougeLsum_recall": 0.2435323142827951, "rougeLsum_recall_stderr": 0.002380294263101675}}, "2": {"tldr_en": {"bleu": 1.641398523262805, "bleu_stderr": 0.05167522892405418, "rouge1_fmeasure": 0.1825901932807019, "rouge1_fmeasure_stderr": 0.001772393389777701, "rouge1_precision": 0.1563882321550081, "rouge1_precision_stderr": 0.001888617387583986, "rouge1_recall": 0.26533453283498676, "rouge1_recall_stderr": 0.0025530833044838525, "rouge2_fmeasure": 0.03484256216837846, "rouge2_fmeasure_stderr": 0.0008050464414919185, "rouge2_precision": 0.03007920986659565, "rouge2_precision_stderr": 0.0007656205465392793, "rouge2_recall": 0.05242348060271486, "rouge2_recall_stderr": 0.001402785333640821, "rougeL_fmeasure": 0.133378449269488, "rougeL_fmeasure_stderr": 0.0011786586689251871, "rougeL_precision": 0.11302771471874037, "rougeL_precision_stderr": 0.0012603520129098162, "rougeL_recall": 0.19883145591680731, "rougeL_recall_stderr": 0.001967593430993135, "rougeLsum_fmeasure": 0.17216601216038344, "rougeLsum_fmeasure_stderr": 0.0016569952491396495, "rougeLsum_precision": 0.14736580481316963, "rougeLsum_precision_stderr": 0.001773298946199036, "rougeLsum_recall": 0.25099172388853663, "rougeLsum_recall_stderr": 0.0024263653927730773}}, "3": {"tldr_en": {"bleu": 1.6905078353779432, "bleu_stderr": 0.07249934930658058, "rouge1_fmeasure": 0.15630117454287198, "rouge1_fmeasure_stderr": 0.002033104554438234, "rouge1_precision": 0.1389473709497086, "rouge1_precision_stderr": 0.002165945649654676, "rouge1_recall": 0.22609159173620905, "rouge1_recall_stderr": 0.0029302654026930365, "rouge2_fmeasure": 0.02997981495146458, "rouge2_fmeasure_stderr": 0.000789727045647715, "rouge2_precision": 0.026390272714025626, "rouge2_precision_stderr": 0.0007567994736605611, "rouge2_recall": 0.04479360431887114, "rouge2_recall_stderr": 0.0013217939246997325, "rougeL_fmeasure": 0.11400981222806023, "rougeL_fmeasure_stderr": 0.0014106173327737745, "rougeL_precision": 0.1008235900865201, "rougeL_precision_stderr": 0.0015515937317845793, "rougeL_recall": 0.16915259930611842, "rougeL_recall_stderr": 0.002256313909124414, "rougeLsum_fmeasure": 0.14696382199884428, "rougeLsum_fmeasure_stderr": 0.0019053060135896015, "rougeLsum_precision": 0.13075025696794762, "rougeLsum_precision_stderr": 0.0020447039924209433, "rougeLsum_recall": 0.21298194277055252, "rougeLsum_recall_stderr": 0.0027618131658537198}}, "4": {"tldr_en": {"bleu": 0.39343180321276056, "bleu_stderr": 0.0293119272772715, "rouge1_fmeasure": 0.053849493676637585, "rouge1_fmeasure_stderr": 0.0018128550224799451, "rouge1_precision": 0.0489492492227955, "rouge1_precision_stderr": 0.001789814805368641, "rouge1_recall": 0.08138629581304692, "rouge1_recall_stderr": 0.002787495081772674, "rouge2_fmeasure": 0.010951183251337409, "rouge2_fmeasure_stderr": 0.000542318137546649, "rouge2_precision": 0.00954245354371464, "rouge2_precision_stderr": 0.000496033168499096, "rouge2_recall": 0.017770514262613592, "rouge2_recall_stderr": 0.001037990108744839, "rougeL_fmeasure": 0.04018322578320604, "rougeL_fmeasure_stderr": 0.0013246122432655602, "rougeL_precision": 0.036730466496340326, "rougeL_precision_stderr": 0.0013603756574255225, "rougeL_recall": 0.06226680749750502, "rougeL_recall_stderr": 0.002169104206622538, "rougeLsum_fmeasure": 0.05051235209315841, "rougeLsum_fmeasure_stderr": 0.0017010930529641197, "rougeLsum_precision": 0.04606259413041724, "rougeLsum_precision_stderr": 0.0016946531131761852, "rougeLsum_recall": 0.07642507746995442, "rougeLsum_recall_stderr": 0.0026253735820234}}, "5": {"tldr_en": {"bleu": 4.795621548580966e-07, "bleu_stderr": 9.116423959336365e-07, "rouge1_fmeasure": 0.008211770721120311, "rouge1_fmeasure_stderr": 0.0007739119234145405, "rouge1_precision": 0.00785532086822979, "rouge1_precision_stderr": 0.0008059057817636163, "rouge1_recall": 0.012189729776176633, "rouge1_recall_stderr": 0.0011529440251866266, "rouge2_fmeasure": 0.0016759752492624186, "rouge2_fmeasure_stderr": 0.00021435787709352103, "rouge2_precision": 0.001629059190316381, "rouge2_precision_stderr": 0.00023332897761005325, "rouge2_recall": 0.0026264060986572716, "rouge2_recall_stderr": 0.00038760636790030855, "rougeL_fmeasure": 0.006313837482340284, "rougeL_fmeasure_stderr": 0.0005834402713093119, "rougeL_precision": 0.006024210894010907, "rougeL_precision_stderr": 0.000610190662185335, "rougeL_recall": 0.009693715133781285, "rougeL_recall_stderr": 0.0009327234614976355, "rougeLsum_fmeasure": 0.007631652279250868, "rougeLsum_fmeasure_stderr": 0.0007207775362203403, "rougeLsum_precision": 0.007292999371042805, "rougeLsum_precision_stderr": 0.0007486511125870423, "rougeLsum_recall": 0.01142399455584086, "rougeLsum_recall_stderr": 0.0010918019151945164}}}, "e2e_nlg_cleaned": {"0": {"generate_text_restaurant": {"bleu": 1.3467292138388522, "bleu_stderr": 0.0636854285236688, "rouge1_fmeasure": 0.12012011760848791, "rouge1_fmeasure_stderr": 0.0013303613929234116, "rouge1_precision": 0.21376122377294582, "rouge1_precision_stderr": 0.003423965804716776, "rouge1_recall": 0.11826204808312468, "rouge1_recall_stderr": 0.0016068929332226103, "rouge2_fmeasure": 0.02367441172991871, "rouge2_fmeasure_stderr": 0.0006343126685728484, "rouge2_precision": 0.04464223015901598, "rouge2_precision_stderr": 0.0015055825472803579, "rouge2_recall": 0.024459729176383012, "rouge2_recall_stderr": 0.0007148574718681848, "rougeL_fmeasure": 0.10396010404779424, "rougeL_fmeasure_stderr": 0.0010907224654039642, "rougeL_precision": 0.17720781770238822, "rougeL_precision_stderr": 0.0025232418694504655, "rougeL_recall": 0.10503799964127797, "rougeL_recall_stderr": 0.001452728215385968, "rougeLsum_fmeasure": 0.10215080373243925, "rougeLsum_fmeasure_stderr": 0.001109159488438079, "rougeLsum_precision": 0.18148501626393876, "rougeLsum_precision_stderr": 0.0027979704321773107, "rougeLsum_recall": 0.10087939658175359, "rougeLsum_recall_stderr": 0.0014051358188386478}}, "1": {"generate_text_restaurant": {"bleu": 4.5480283931845324, "bleu_stderr": 0.05660434588182871, "rouge1_fmeasure": 0.28179765051154215, "rouge1_fmeasure_stderr": 0.0018423691903722364, "rouge1_precision": 0.23525526703689217, "rouge1_precision_stderr": 0.002224131117862929, "rouge1_recall": 0.41213522865304736, "rouge1_recall_stderr": 0.0026261778490009914, "rouge2_fmeasure": 0.10436721293825027, "rouge2_fmeasure_stderr": 0.0012564399976213632, "rouge2_precision": 0.08756330373099659, "rouge2_precision_stderr": 0.001382664098826369, "rouge2_recall": 0.15485417637322493, "rouge2_recall_stderr": 0.001859705859804789, "rougeL_fmeasure": 0.2209222812840664, "rougeL_fmeasure_stderr": 0.0014041408204809602, "rougeL_precision": 0.18389946486758244, "rougeL_precision_stderr": 0.0017430632737902262, "rougeL_recall": 0.3260598830971049, "rougeL_recall_stderr": 0.0021720923944008705, "rougeLsum_fmeasure": 0.23443730171613159, "rougeLsum_fmeasure_stderr": 0.0016999346317063447, "rougeLsum_precision": 0.19611766071180928, "rougeLsum_precision_stderr": 0.002000511520927801, "rougeLsum_recall": 0.3429462721297835, "rougeLsum_recall_stderr": 0.002447036789471601}}, "2": {"generate_text_restaurant": {"bleu": 4.919099078160439, "bleu_stderr": 0.07401079447832073, "rouge1_fmeasure": 0.2848021533685038, "rouge1_fmeasure_stderr": 0.0017517841909149951, "rouge1_precision": 0.22830891168453196, "rouge1_precision_stderr": 0.0020226351669978943, "rouge1_recall": 0.430501449249562, "rouge1_recall_stderr": 0.0025067528428449337, "rouge2_fmeasure": 0.11056535384060841, "rouge2_fmeasure_stderr": 0.0012335424952574436, "rouge2_precision": 0.08874046699895509, "rouge2_precision_stderr": 0.0012536346039166443, "rouge2_recall": 0.17058058024587597, "rouge2_recall_stderr": 0.0019277334580117154, "rougeL_fmeasure": 0.22429066792419844, "rougeL_fmeasure_stderr": 0.0013639521320318918, "rougeL_precision": 0.17874631886223866, "rougeL_precision_stderr": 0.0015432601430013146, "rougeL_recall": 0.34228892513027326, "rougeL_recall_stderr": 0.0021544507147917644, "rougeLsum_fmeasure": 0.23961627743436656, "rougeLsum_fmeasure_stderr": 0.0016466360617377184, "rougeLsum_precision": 0.19159590399736812, "rougeLsum_precision_stderr": 0.0017744554514183184, "rougeLsum_recall": 0.36333660692954056, "rougeLsum_recall_stderr": 0.0024452838301491264}}, "3": {"generate_text_restaurant": {"bleu": 5.161685848623118, "bleu_stderr": 0.07262509824163077, "rouge1_fmeasure": 0.28625759764760766, "rouge1_fmeasure_stderr": 0.0017505915200592458, "rouge1_precision": 0.2250406541329284, "rouge1_precision_stderr": 0.0018984959829563015, "rouge1_recall": 0.4401409797987255, "rouge1_recall_stderr": 0.0024818459349912466, "rouge2_fmeasure": 0.11431119935407852, "rouge2_fmeasure_stderr": 0.0012264659705919982, "rouge2_precision": 0.08992659254313957, "rouge2_precision_stderr": 0.0012057214319225603, "rouge2_recall": 0.17962663745940138, "rouge2_recall_stderr": 0.00190969756064409, "rougeL_fmeasure": 0.22718964393483773, "rougeL_fmeasure_stderr": 0.001341523865438878, "rougeL_precision": 0.17814189014708015, "rougeL_precision_stderr": 0.001501724354676948, "rougeL_recall": 0.3526106772291693, "rougeL_recall_stderr": 0.0021197068010549917, "rougeLsum_fmeasure": 0.24420233251967818, "rougeLsum_fmeasure_stderr": 0.0016511867365175956, "rougeLsum_precision": 0.19224724023096493, "rougeLsum_precision_stderr": 0.0017539464959385562, "rougeLsum_recall": 0.375736139296112, "rougeLsum_recall_stderr": 0.0024062560460738677}}, "4": {"generate_text_restaurant": {"bleu": 5.3863626535773195, "bleu_stderr": 0.08316568360369772, "rouge1_fmeasure": 0.2884803003096355, "rouge1_fmeasure_stderr": 0.0017316301619347632, "rouge1_precision": 0.22591638424042498, "rouge1_precision_stderr": 0.001851012114615343, "rouge1_recall": 0.44465520609703646, "rouge1_recall_stderr": 0.0024822890206687306, "rouge2_fmeasure": 0.11718583569111816, "rouge2_fmeasure_stderr": 0.00121705170719205, "rouge2_precision": 0.09137947270797166, "rouge2_precision_stderr": 0.0011328131792298333, "rouge2_recall": 0.18516155808078238, "rouge2_recall_stderr": 0.0019428991404911535, "rougeL_fmeasure": 0.22838715083098254, "rougeL_fmeasure_stderr": 0.0013209819868746765, "rougeL_precision": 0.17791538730013262, "rougeL_precision_stderr": 0.001385852845968636, "rougeL_recall": 0.3555171974183999, "rougeL_recall_stderr": 0.0021223337675852177, "rougeLsum_fmeasure": 0.2473033223648628, "rougeLsum_fmeasure_stderr": 0.001629820147671333, "rougeLsum_precision": 0.1934093946653807, "rougeLsum_precision_stderr": 0.0016535132345320634, "rougeLsum_recall": 0.3819852960374735, "rougeLsum_recall_stderr": 0.0024230711787691338}}, "5": {"generate_text_restaurant": {"bleu": 5.218311341485651, "bleu_stderr": 0.08555182976780383, "rouge1_fmeasure": 0.2851279405049657, "rouge1_fmeasure_stderr": 0.0017156941599383252, "rouge1_precision": 0.22420804212245024, "rouge1_precision_stderr": 0.0018931092685607832, "rouge1_recall": 0.43645148946569756, "rouge1_recall_stderr": 0.0023925455584187143, "rouge2_fmeasure": 0.11398867145332987, "rouge2_fmeasure_stderr": 0.0012184034191725704, "rouge2_precision": 0.08976861428854209, "rouge2_precision_stderr": 0.0012265411317482072, "rouge2_recall": 0.17860416167471355, "rouge2_recall_stderr": 0.001894485841362118, "rougeL_fmeasure": 0.22589371892600646, "rougeL_fmeasure_stderr": 0.001329494456764217, "rougeL_precision": 0.17705341704222277, "rougeL_precision_stderr": 0.001496237569767933, "rougeL_recall": 0.3489555989991215, "rougeL_recall_stderr": 0.0020756478234175003, "rougeLsum_fmeasure": 0.24529704048909337, "rougeLsum_fmeasure_stderr": 0.0016364362199438327, "rougeLsum_precision": 0.19291128629856713, "rougeLsum_precision_stderr": 0.001743268774937326, "rougeLsum_recall": 0.3757535087761027, "rougeLsum_recall_stderr": 0.0023376729302477164}}}, "gem_xsum": {"0": {"article_DOC_summary": {"bleu": 1.2992802626075217, "bleu_stderr": 0.08613536173053919, "rouge1_fmeasure": 0.19317514090993446, "rouge1_fmeasure_stderr": 0.0022112014874136276, "rouge1_precision": 0.1404335293516036, "rouge1_precision_stderr": 0.0018475752933584198, "rouge1_recall": 0.33304948876480905, "rouge1_recall_stderr": 0.0038506848151682277, "rouge2_fmeasure": 0.03629759048462241, "rouge2_fmeasure_stderr": 0.0012314297081491255, "rouge2_precision": 0.026070215267481753, "rouge2_precision_stderr": 0.0009166794828332532, "rouge2_recall": 0.06470743754786817, "rouge2_recall_stderr": 0.0022637761051235894, "rougeL_fmeasure": 0.14245726390092303, "rougeL_fmeasure_stderr": 0.001599761390324437, "rougeL_precision": 0.1032551941800083, "rougeL_precision_stderr": 0.0013020422069113654, "rougeL_recall": 0.24743139771736608, "rougeL_recall_stderr": 0.0029799847541024864, "rougeLsum_fmeasure": 0.1525513019630977, "rougeLsum_fmeasure_stderr": 0.0018062738518410612, "rougeLsum_precision": 0.11056793408323284, "rougeLsum_precision_stderr": 0.0014447008795606224, "rougeLsum_recall": 0.2644863518283602, "rougeLsum_recall_stderr": 0.003301240029680331}}, "1": {"article_DOC_summary": {"bleu": 0.9392811645900702, "bleu_stderr": 0.07096662177652757, "rouge1_fmeasure": 0.163100228567693, "rouge1_fmeasure_stderr": 0.002132266466808726, "rouge1_precision": 0.11583572927874138, "rouge1_precision_stderr": 0.0015868267173138404, "rouge1_recall": 0.28673470669230483, "rouge1_recall_stderr": 0.003637777293225723, "rouge2_fmeasure": 0.02461427079155061, "rouge2_fmeasure_stderr": 0.001063162698284129, "rouge2_precision": 0.01724716231152785, "rouge2_precision_stderr": 0.0007449366916925016, "rouge2_recall": 0.04477737050796163, "rouge2_recall_stderr": 0.00198811760305303, "rougeL_fmeasure": 0.12465414516933276, "rougeL_fmeasure_stderr": 0.001518543329628805, "rougeL_precision": 0.08830410964622547, "rougeL_precision_stderr": 0.0011164040071930121, "rougeL_recall": 0.22077364895161825, "rougeL_recall_stderr": 0.0027438079045214113, "rougeLsum_fmeasure": 0.13165914823095848, "rougeLsum_fmeasure_stderr": 0.001722148826191323, "rougeLsum_precision": 0.09327309336629477, "rougeLsum_precision_stderr": 0.001264500539576057, "rougeLsum_recall": 0.23298075051437098, "rougeLsum_recall_stderr": 0.003053175396768166}}, "2": {"article_DOC_summary": {"bleu": 0.8642738469290718, "bleu_stderr": 0.0828969271702355, "rouge1_fmeasure": 0.16310151647769613, "rouge1_fmeasure_stderr": 0.0021173776446693038, "rouge1_precision": 0.11587525551966481, "rouge1_precision_stderr": 0.0016045754710452714, "rouge1_recall": 0.2874887710310145, "rouge1_recall_stderr": 0.003567488833961318, "rouge2_fmeasure": 0.02540910163910677, "rouge2_fmeasure_stderr": 0.0010850659455729865, "rouge2_precision": 0.01786609643978251, "rouge2_precision_stderr": 0.0007624665922748118, "rouge2_recall": 0.046073666078135844, "rouge2_recall_stderr": 0.00202411128686605, "rougeL_fmeasure": 0.12516134814219937, "rougeL_fmeasure_stderr": 0.0015660208564047945, "rougeL_precision": 0.08869240853211423, "rougeL_precision_stderr": 0.0011665769716760525, "rougeL_recall": 0.2219053477816373, "rougeL_recall_stderr": 0.002750331221052164, "rougeLsum_fmeasure": 0.13195206984139488, "rougeLsum_fmeasure_stderr": 0.0017467533202419128, "rougeLsum_precision": 0.09346436388002839, "rougeLsum_precision_stderr": 0.0012938167406065764, "rougeLsum_recall": 0.23423731441915813, "rougeLsum_recall_stderr": 0.003085268456864704}}, "3": {"article_DOC_summary": {"bleu": 0.8836853896564532, "bleu_stderr": 0.04539990589714401, "rouge1_fmeasure": 0.15604881038304613, "rouge1_fmeasure_stderr": 0.0022637041314365453, "rouge1_precision": 0.11296838065461887, "rouge1_precision_stderr": 0.0017763597852222038, "rouge1_recall": 0.2719068297050645, "rouge1_recall_stderr": 0.0038490332935536237, "rouge2_fmeasure": 0.023753467717060665, "rouge2_fmeasure_stderr": 0.0010443537949278742, "rouge2_precision": 0.01707269817022361, "rouge2_precision_stderr": 0.0007693549928763936, "rouge2_recall": 0.042123589858273434, "rouge2_recall_stderr": 0.0018755138592056807, "rougeL_fmeasure": 0.11872182977619025, "rougeL_fmeasure_stderr": 0.0016793576149961092, "rougeL_precision": 0.08602111381227089, "rougeL_precision_stderr": 0.001348786781692891, "rougeL_recall": 0.20806883128782105, "rougeL_recall_stderr": 0.0029718527370379577, "rougeLsum_fmeasure": 0.12609518726408814, "rougeLsum_fmeasure_stderr": 0.0018237508130951488, "rougeLsum_precision": 0.09123263400217625, "rougeLsum_precision_stderr": 0.0014417280224893359, "rougeLsum_recall": 0.22083691751530135, "rougeLsum_recall_stderr": 0.0031880991373431033}}, "4": {"article_DOC_summary": {"bleu": 0.32264946943694406, "bleu_stderr": 0.06831405512505326, "rouge1_fmeasure": 0.04091181078946866, "rouge1_fmeasure_stderr": 0.0022902327278297046, "rouge1_precision": 0.034882897379201874, "rouge1_precision_stderr": 0.002246767493274493, "rouge1_recall": 0.06473914976317797, "rouge1_recall_stderr": 0.0037002010817473985, "rouge2_fmeasure": 0.0052797964519696655, "rouge2_fmeasure_stderr": 0.0005471044968877006, "rouge2_precision": 0.0038285864418821543, "rouge2_precision_stderr": 0.00040689869864601153, "rouge2_recall": 0.009305544911384899, "rouge2_recall_stderr": 0.0009789224679047535, "rougeL_fmeasure": 0.03128707048743581, "rougeL_fmeasure_stderr": 0.0017437540939162011, "rougeL_precision": 0.027308146633009903, "rougeL_precision_stderr": 0.0019083153741966364, "rougeL_recall": 0.04967049431208105, "rougeL_recall_stderr": 0.0028488023843374856, "rougeLsum_fmeasure": 0.03330241832085698, "rougeLsum_fmeasure_stderr": 0.0018775032498108398, "rougeLsum_precision": 0.028950850747643437, "rougeLsum_precision_stderr": 0.0019932883821356198, "rougeLsum_recall": 0.05263176539885643, "rougeLsum_recall_stderr": 0.003033293906854166}}, "5": {"article_DOC_summary": {"bleu": 1.7543632002989705e-39, "bleu_stderr": 1.694640730371467e-33, "rouge1_fmeasure": 0.002011613476498758, "rouge1_fmeasure_stderr": 0.0005611516641301552, "rouge1_precision": 0.002234714565312147, "rouge1_precision_stderr": 0.0006324566810963234, "rouge1_recall": 0.0019083246709728258, "rouge1_recall_stderr": 0.0005363735849273349, "rouge2_fmeasure": 0.00025972087637987314, "rouge2_fmeasure_stderr": 0.00018245934977293284, "rouge2_precision": 0.000275577641004944, "rouge2_precision_stderr": 0.00018655929326294164, "rouge2_recall": 0.00024871355060034306, "rouge2_recall_stderr": 0.00018003279128987707, "rougeL_fmeasure": 0.0015954209721237727, "rougeL_fmeasure_stderr": 0.00046728726635727905, "rougeL_precision": 0.0017513556534527388, "rougeL_precision_stderr": 0.0005186881670205111, "rougeL_recall": 0.0015379808798967414, "rougeL_recall_stderr": 0.00045866786099632605, "rougeLsum_fmeasure": 0.0017182753671868714, "rougeLsum_fmeasure_stderr": 0.0004901161371032653, "rougeLsum_precision": 0.001897742561259706, "rougeLsum_precision_stderr": 0.0005481199006190125, "rougeLsum_recall": 0.0016448900434096786, "rougeLsum_recall_stderr": 0.0004764592460236093}}}} \ No newline at end of file diff --git a/4b284b1b9c4seed1/evaluation/generation/slim.4b284b1b9c4seed1_GEM-web_nlg_en_PALM_prompt_0.json b/4b284b1b9c4seed1/evaluation/generation/slim.4b284b1b9c4seed1_GEM-web_nlg_en_PALM_prompt_0.json new file mode 100644 index 0000000000000000000000000000000000000000..24335bb30451bd2148d8d165d515c6897510117e --- /dev/null +++ b/4b284b1b9c4seed1/evaluation/generation/slim.4b284b1b9c4seed1_GEM-web_nlg_en_PALM_prompt_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.3066098749246226, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.026080136938068845 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.07111826415088063, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.002839089906272575 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.2506712149564081, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.004757508557066865 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.08751164861028739, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.00199981726737483 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.03319077620530337, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0020231897791775106 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.11077608891772334, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.003107351453235033 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.03876750875187201, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.001265364536751268 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.06647718723035836, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0026791734683438173 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.23570838504150982, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.00455197819987753 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.08166593395748795, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0018388377390052121 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.06672890451920119, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.002733920332843438 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.23129644774314756, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0043201593384418835 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.08123251691641209, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0018438238359305395 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b1b9c4seed1/evaluation/generation/slim.4b284b1b9c4seed1_GEM-web_nlg_en_PALM_prompt_1.json b/4b284b1b9c4seed1/evaluation/generation/slim.4b284b1b9c4seed1_GEM-web_nlg_en_PALM_prompt_1.json new file mode 100644 index 0000000000000000000000000000000000000000..e409d98c2da7c97d3ef71b4b496ccdb94d688ed9 --- /dev/null +++ b/4b284b1b9c4seed1/evaluation/generation/slim.4b284b1b9c4seed1_GEM-web_nlg_en_PALM_prompt_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.3038192608605564, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.015699254374158 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.05683590873929071, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0020467792157088907 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.27017378109951967, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.004955059066352234 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.08003564917768238, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0016231021328505706 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.02302654571104229, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0013956717371657963 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.11037888710881248, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0030905387552418112 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.03157133816619759, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0009524060107538227 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.05138484982672407, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0019566614919068054 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.24316258353203007, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004414830331308628 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.07172579578796798, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0014182749325865474 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.05290704322980144, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0019882546868578662 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.24942020154922606, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0044964221550096405 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.07395133279168084, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0014906191471968171 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b1b9c4seed1/evaluation/generation/slim.4b284b1b9c4seed1_GEM-web_nlg_en_PALM_prompt_2.json b/4b284b1b9c4seed1/evaluation/generation/slim.4b284b1b9c4seed1_GEM-web_nlg_en_PALM_prompt_2.json new file mode 100644 index 0000000000000000000000000000000000000000..9301ab60334c062b6a82a478846b23b5f05b7042 --- /dev/null +++ b/4b284b1b9c4seed1/evaluation/generation/slim.4b284b1b9c4seed1_GEM-web_nlg_en_PALM_prompt_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.2987651957407001, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.01165146487326007 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.05700016441399435, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0017866333928080581 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.2804134367029925, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.004805713426369978 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.0831895052852721, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.001625324041245366 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.02233985054458201, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0010710584040813141 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.11320206879663894, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.002939251451992755 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.032089824292963406, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0009447259591619087 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.04971200204444394, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0015276050991763481 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.24706303672621477, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004167944129872773 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.07258794061798622, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0013375852482102129 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.05309006495197277, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0016898819992046204 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.2605549805843784, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004415202735971505 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.0771940777807749, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0014906191322966035 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b1b9c4seed1/evaluation/generation/slim.4b284b1b9c4seed1_GEM-web_nlg_en_PALM_prompt_3.json b/4b284b1b9c4seed1/evaluation/generation/slim.4b284b1b9c4seed1_GEM-web_nlg_en_PALM_prompt_3.json new file mode 100644 index 0000000000000000000000000000000000000000..2be286b17bfe348c411edb2e0e46a65011156af7 --- /dev/null +++ b/4b284b1b9c4seed1/evaluation/generation/slim.4b284b1b9c4seed1_GEM-web_nlg_en_PALM_prompt_3.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.3178292125394837, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.016436461817007326 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.05949762170434375, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.002164217791856107 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.2804633597246112, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.004772273934843173 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.08130575650688132, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.001537824456242504 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.02315468230294224, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0013116150015292844 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.11210805274384686, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0030446087077799903 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.03098393961344455, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0009090838201088959 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.05296448349205633, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.002039688636224555 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.24654397231374384, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004152222617956148 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.07145815124416759, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0013532821520358354 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.05596829767493985, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0021073938497608454 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.2610555009310582, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004427499077140127 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.07576475402518883, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0014334163239098205 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 3, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b1b9c4seed1/evaluation/generation/slim.4b284b1b9c4seed1_GEM-web_nlg_en_PALM_prompt_4.json b/4b284b1b9c4seed1/evaluation/generation/slim.4b284b1b9c4seed1_GEM-web_nlg_en_PALM_prompt_4.json new file mode 100644 index 0000000000000000000000000000000000000000..9b403095273d2f69e41611bb7efe26c9fa1799c3 --- /dev/null +++ b/4b284b1b9c4seed1/evaluation/generation/slim.4b284b1b9c4seed1_GEM-web_nlg_en_PALM_prompt_4.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.33395098766218884, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.018968072553356623 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.05735023477794692, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0018410250349017107 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.29141762974212615, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.004822950393157349 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.08367597785312914, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0016033089150747774 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.021651705429468177, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0010514293026879199 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.11750125883404142, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.003178578433572342 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.031540027671483784, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0009467316903388299 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.050054640877740926, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0016864461898684513 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.25450526989064276, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004210704440467058 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.07260423911237245, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.001376149178581389 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.05345237810332766, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0017804800879000749 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.2697483182511519, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004417715268392961 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.07753657862492522, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.001496405647152453 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 4, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b1b9c4seed1/evaluation/generation/slim.4b284b1b9c4seed1_GEM-web_nlg_en_PALM_prompt_5.json b/4b284b1b9c4seed1/evaluation/generation/slim.4b284b1b9c4seed1_GEM-web_nlg_en_PALM_prompt_5.json new file mode 100644 index 0000000000000000000000000000000000000000..1b4950e72c9fe81afe43e70b735f15619ae61c55 --- /dev/null +++ b/4b284b1b9c4seed1/evaluation/generation/slim.4b284b1b9c4seed1_GEM-web_nlg_en_PALM_prompt_5.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.3641656854611542, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.015309152040195284 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.052896109217414104, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0014365647910545604 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.28995885739987826, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.00491862249100831 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.0809120070880779, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0014755261393375114 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.01993001210350518, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0007373235006634328 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.11732616625283977, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0031965230579063257 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.030494115579364812, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0008357516400780779 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.04580220322739789, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.001313492675076717 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.25087552702336663, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004197343182524436 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.06970781602649807, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0012557281083211698 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.04920701939583041, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0013657560657982203 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.2686976948346208, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.00450965297817273 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.0750837322403333, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.001370229544506872 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 5, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b1b9c4seed1/evaluation/generation/slim.4b284b1b9c4seed1_GEM-wiki_lingua_en_tldr_en_0.json b/4b284b1b9c4seed1/evaluation/generation/slim.4b284b1b9c4seed1_GEM-wiki_lingua_en_tldr_en_0.json new file mode 100644 index 0000000000000000000000000000000000000000..2573f14b2ba49b076dc0dfab1005fa08a757c231 --- /dev/null +++ b/4b284b1b9c4seed1/evaluation/generation/slim.4b284b1b9c4seed1_GEM-wiki_lingua_en_tldr_en_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.153949065103856, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0018954240620966882 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.25650646122704474, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0024640946950302985 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.17763908527361025, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0017411319281415913 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.028019269400656518, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0007188326863079863 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.04807149188073896, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0012737937496356626 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.03228562656211838, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0007610456704112464 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.114473205278599, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0013050419999849348 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.1979090080195594, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0019738106671277266 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.1335773049328249, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.001206400625022134 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.1434687817382672, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.001762712661710752 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.24013798061889524, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.002330459097368292 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.16579309345906998, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0016200879357240658 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 1.3310013488043524, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.051303312771233796 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b1b9c4seed1/evaluation/generation/slim.4b284b1b9c4seed1_GEM-wiki_lingua_en_tldr_en_1.json b/4b284b1b9c4seed1/evaluation/generation/slim.4b284b1b9c4seed1_GEM-wiki_lingua_en_tldr_en_1.json new file mode 100644 index 0000000000000000000000000000000000000000..46ff15181534542bebe68fa963bedecef22dd0cb --- /dev/null +++ b/4b284b1b9c4seed1/evaluation/generation/slim.4b284b1b9c4seed1_GEM-wiki_lingua_en_tldr_en_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.15222498270112908, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0018427545457994695 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.2575304318026435, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0025171368376624634 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.17784343637401165, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0017678913033546437 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.027223166689333656, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0007022412791947103 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.047627933423561246, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0012809278259731988 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.03198373436508538, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0007797542212099719 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.10932432127036033, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.001193214863192186 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.19223797000244636, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.001923076446257654 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.1293204461841411, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.001171111199270059 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.1432522940492175, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0017229652479762334 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.2435323142827951, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.002380294263101675 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.16757050221415196, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0016483223875673962 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 1.538506754528524, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.05237098925801456 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b1b9c4seed1/evaluation/generation/slim.4b284b1b9c4seed1_GEM-wiki_lingua_en_tldr_en_2.json b/4b284b1b9c4seed1/evaluation/generation/slim.4b284b1b9c4seed1_GEM-wiki_lingua_en_tldr_en_2.json new file mode 100644 index 0000000000000000000000000000000000000000..a7fb163b98df5c2e14d790864e69af26b3aa34ab --- /dev/null +++ b/4b284b1b9c4seed1/evaluation/generation/slim.4b284b1b9c4seed1_GEM-wiki_lingua_en_tldr_en_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.1563882321550081, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.001888617387583986 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.26533453283498676, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0025530833044838525 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.1825901932807019, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.001772393389777701 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.03007920986659565, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0007656205465392793 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.05242348060271486, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.001402785333640821 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.03484256216837846, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0008050464414919185 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.11302771471874037, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0012603520129098162 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.19883145591680731, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.001967593430993135 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.133378449269488, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0011786586689251871 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.14736580481316963, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.001773298946199036 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.25099172388853663, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0024263653927730773 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.17216601216038344, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0016569952491396495 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 1.641398523262805, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.05167522892405418 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b1b9c4seed1/evaluation/generation/slim.4b284b1b9c4seed1_GEM-wiki_lingua_en_tldr_en_3.json b/4b284b1b9c4seed1/evaluation/generation/slim.4b284b1b9c4seed1_GEM-wiki_lingua_en_tldr_en_3.json new file mode 100644 index 0000000000000000000000000000000000000000..9d60edd2b5d893482f42cfc41cf9a3f285647e08 --- /dev/null +++ b/4b284b1b9c4seed1/evaluation/generation/slim.4b284b1b9c4seed1_GEM-wiki_lingua_en_tldr_en_3.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.1389473709497086, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.002165945649654676 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.22609159173620905, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0029302654026930365 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.15630117454287198, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.002033104554438234 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.026390272714025626, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0007567994736605611 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.04479360431887114, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0013217939246997325 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.02997981495146458, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.000789727045647715 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.1008235900865201, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0015515937317845793 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.16915259930611842, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.002256313909124414 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.11400981222806023, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0014106173327737745 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.13075025696794762, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0020447039924209433 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.21298194277055252, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0027618131658537198 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.14696382199884428, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0019053060135896015 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 1.6905078353779432, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.07249934930658058 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 3, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b1b9c4seed1/evaluation/generation/slim.4b284b1b9c4seed1_GEM-wiki_lingua_en_tldr_en_4.json b/4b284b1b9c4seed1/evaluation/generation/slim.4b284b1b9c4seed1_GEM-wiki_lingua_en_tldr_en_4.json new file mode 100644 index 0000000000000000000000000000000000000000..74d4d0d06559c257219aab0c07a39b4ca8f73b2d --- /dev/null +++ b/4b284b1b9c4seed1/evaluation/generation/slim.4b284b1b9c4seed1_GEM-wiki_lingua_en_tldr_en_4.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.0489492492227955, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.001789814805368641 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.08138629581304692, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.002787495081772674 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.053849493676637585, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0018128550224799451 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.00954245354371464, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.000496033168499096 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.017770514262613592, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.001037990108744839 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.010951183251337409, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.000542318137546649 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.036730466496340326, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0013603756574255225 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.06226680749750502, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.002169104206622538 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.04018322578320604, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0013246122432655602 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.04606259413041724, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0016946531131761852 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.07642507746995442, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0026253735820234 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.05051235209315841, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0017010930529641197 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 0.39343180321276056, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.0293119272772715 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 4, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b1b9c4seed1/evaluation/generation/slim.4b284b1b9c4seed1_GEM-wiki_lingua_en_tldr_en_5.json b/4b284b1b9c4seed1/evaluation/generation/slim.4b284b1b9c4seed1_GEM-wiki_lingua_en_tldr_en_5.json new file mode 100644 index 0000000000000000000000000000000000000000..ceaeb98be182e949fd0cde79468024a9f4b648ad --- /dev/null +++ b/4b284b1b9c4seed1/evaluation/generation/slim.4b284b1b9c4seed1_GEM-wiki_lingua_en_tldr_en_5.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.00785532086822979, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0008059057817636163 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.012189729776176633, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0011529440251866266 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.008211770721120311, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0007739119234145405 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.001629059190316381, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.00023332897761005325 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.0026264060986572716, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.00038760636790030855 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.0016759752492624186, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.00021435787709352103 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.006024210894010907, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.000610190662185335 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.009693715133781285, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0009327234614976355 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.006313837482340284, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0005834402713093119 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.007292999371042805, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0007486511125870423 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.01142399455584086, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0010918019151945164 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.007631652279250868, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0007207775362203403 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 4.795621548580966e-07, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 9.116423959336365e-07 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 5, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b1b9c4seed1/evaluation/generation/slim.4b284b1b9c4seed1_e2e_nlg_cleaned_generate_text_restaurant_0.json b/4b284b1b9c4seed1/evaluation/generation/slim.4b284b1b9c4seed1_e2e_nlg_cleaned_generate_text_restaurant_0.json new file mode 100644 index 0000000000000000000000000000000000000000..0de7da13b327d665f4da386d139bc3b70611a1d1 --- /dev/null +++ b/4b284b1b9c4seed1/evaluation/generation/slim.4b284b1b9c4seed1_e2e_nlg_cleaned_generate_text_restaurant_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 1.3467292138388522, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.0636854285236688 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.21376122377294582, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.003423965804716776 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.11826204808312468, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.0016068929332226103 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.12012011760848791, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.0013303613929234116 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.04464223015901598, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0015055825472803579 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.024459729176383012, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.0007148574718681848 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.02367441172991871, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0006343126685728484 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.17720781770238822, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.0025232418694504655 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.10503799964127797, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.001452728215385968 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.10396010404779424, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0010907224654039642 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.18148501626393876, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.0027979704321773107 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.10087939658175359, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.0014051358188386478 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.10215080373243925, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.001109159488438079 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b1b9c4seed1/evaluation/generation/slim.4b284b1b9c4seed1_e2e_nlg_cleaned_generate_text_restaurant_1.json b/4b284b1b9c4seed1/evaluation/generation/slim.4b284b1b9c4seed1_e2e_nlg_cleaned_generate_text_restaurant_1.json new file mode 100644 index 0000000000000000000000000000000000000000..3335aad9bb78f2e298475dfec73520f6e48f2437 --- /dev/null +++ b/4b284b1b9c4seed1/evaluation/generation/slim.4b284b1b9c4seed1_e2e_nlg_cleaned_generate_text_restaurant_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 4.5480283931845324, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.05660434588182871 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.23525526703689217, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.002224131117862929 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.41213522865304736, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.0026261778490009914 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.28179765051154215, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.0018423691903722364 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.08756330373099659, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.001382664098826369 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.15485417637322493, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.001859705859804789 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.10436721293825027, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0012564399976213632 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.18389946486758244, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.0017430632737902262 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.3260598830971049, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.0021720923944008705 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.2209222812840664, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0014041408204809602 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.19611766071180928, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.002000511520927801 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.3429462721297835, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.002447036789471601 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.23443730171613159, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0016999346317063447 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b1b9c4seed1/evaluation/generation/slim.4b284b1b9c4seed1_e2e_nlg_cleaned_generate_text_restaurant_2.json b/4b284b1b9c4seed1/evaluation/generation/slim.4b284b1b9c4seed1_e2e_nlg_cleaned_generate_text_restaurant_2.json new file mode 100644 index 0000000000000000000000000000000000000000..6a05fbc46b209409b70b39a98a7f84b3bbb70c4b --- /dev/null +++ b/4b284b1b9c4seed1/evaluation/generation/slim.4b284b1b9c4seed1_e2e_nlg_cleaned_generate_text_restaurant_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 4.919099078160439, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.07401079447832073 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.22830891168453196, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.0020226351669978943 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.430501449249562, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.0025067528428449337 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.2848021533685038, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.0017517841909149951 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.08874046699895509, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0012536346039166443 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.17058058024587597, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.0019277334580117154 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.11056535384060841, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0012335424952574436 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.17874631886223866, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.0015432601430013146 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.34228892513027326, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.0021544507147917644 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.22429066792419844, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0013639521320318918 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.19159590399736812, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.0017744554514183184 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.36333660692954056, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.0024452838301491264 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.23961627743436656, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0016466360617377184 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b1b9c4seed1/evaluation/generation/slim.4b284b1b9c4seed1_e2e_nlg_cleaned_generate_text_restaurant_3.json b/4b284b1b9c4seed1/evaluation/generation/slim.4b284b1b9c4seed1_e2e_nlg_cleaned_generate_text_restaurant_3.json new file mode 100644 index 0000000000000000000000000000000000000000..7ace362598cc29601f996466ebb7d66f0e418966 --- /dev/null +++ b/4b284b1b9c4seed1/evaluation/generation/slim.4b284b1b9c4seed1_e2e_nlg_cleaned_generate_text_restaurant_3.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 5.161685848623118, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.07262509824163077 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.2250406541329284, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.0018984959829563015 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.4401409797987255, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.0024818459349912466 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.28625759764760766, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.0017505915200592458 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.08992659254313957, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0012057214319225603 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.17962663745940138, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.00190969756064409 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.11431119935407852, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0012264659705919982 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.17814189014708015, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.001501724354676948 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.3526106772291693, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.0021197068010549917 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.22718964393483773, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.001341523865438878 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.19224724023096493, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.0017539464959385562 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.375736139296112, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.0024062560460738677 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.24420233251967818, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0016511867365175956 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 3, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b1b9c4seed1/evaluation/generation/slim.4b284b1b9c4seed1_e2e_nlg_cleaned_generate_text_restaurant_4.json b/4b284b1b9c4seed1/evaluation/generation/slim.4b284b1b9c4seed1_e2e_nlg_cleaned_generate_text_restaurant_4.json new file mode 100644 index 0000000000000000000000000000000000000000..a915d24cf180ebc464583804ef27aa47b136ec5d --- /dev/null +++ b/4b284b1b9c4seed1/evaluation/generation/slim.4b284b1b9c4seed1_e2e_nlg_cleaned_generate_text_restaurant_4.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 5.3863626535773195, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.08316568360369772 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.22591638424042498, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.001851012114615343 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.44465520609703646, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.0024822890206687306 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.2884803003096355, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.0017316301619347632 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.09137947270797166, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0011328131792298333 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.18516155808078238, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.0019428991404911535 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.11718583569111816, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.00121705170719205 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.17791538730013262, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.001385852845968636 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.3555171974183999, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.0021223337675852177 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.22838715083098254, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0013209819868746765 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.1934093946653807, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.0016535132345320634 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.3819852960374735, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.0024230711787691338 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.2473033223648628, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.001629820147671333 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 4, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b1b9c4seed1/evaluation/generation/slim.4b284b1b9c4seed1_e2e_nlg_cleaned_generate_text_restaurant_5.json b/4b284b1b9c4seed1/evaluation/generation/slim.4b284b1b9c4seed1_e2e_nlg_cleaned_generate_text_restaurant_5.json new file mode 100644 index 0000000000000000000000000000000000000000..a027cab42b8c74436d70c0cf6e8340efe064d709 --- /dev/null +++ b/4b284b1b9c4seed1/evaluation/generation/slim.4b284b1b9c4seed1_e2e_nlg_cleaned_generate_text_restaurant_5.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 5.218311341485651, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.08555182976780383 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.22420804212245024, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.0018931092685607832 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.43645148946569756, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.0023925455584187143 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.2851279405049657, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.0017156941599383252 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.08976861428854209, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0012265411317482072 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.17860416167471355, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.001894485841362118 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.11398867145332987, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0012184034191725704 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.17705341704222277, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.001496237569767933 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.3489555989991215, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.0020756478234175003 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.22589371892600646, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.001329494456764217 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.19291128629856713, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.001743268774937326 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.3757535087761027, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.0023376729302477164 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.24529704048909337, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0016364362199438327 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 5, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b1b9c4seed1/evaluation/generation/slim.4b284b1b9c4seed1_gem_xsum_article_DOC_summary_0.json b/4b284b1b9c4seed1/evaluation/generation/slim.4b284b1b9c4seed1_gem_xsum_article_DOC_summary_0.json new file mode 100644 index 0000000000000000000000000000000000000000..94e4efb80faebdb5834e356ed0574011c0fddba6 --- /dev/null +++ b/4b284b1b9c4seed1/evaluation/generation/slim.4b284b1b9c4seed1_gem_xsum_article_DOC_summary_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.1404335293516036, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.0018475752933584198 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.33304948876480905, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.0038506848151682277 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.19317514090993446, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.0022112014874136276 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.026070215267481753, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0009166794828332532 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.06470743754786817, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.0022637761051235894 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.03629759048462241, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0012314297081491255 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.1032551941800083, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0013020422069113654 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.24743139771736608, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.0029799847541024864 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.14245726390092303, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.001599761390324437 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.11056793408323284, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0014447008795606224 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.2644863518283602, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.003301240029680331 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.1525513019630977, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0018062738518410612 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 1.2992802626075217, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.08613536173053919 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b1b9c4seed1/evaluation/generation/slim.4b284b1b9c4seed1_gem_xsum_article_DOC_summary_1.json b/4b284b1b9c4seed1/evaluation/generation/slim.4b284b1b9c4seed1_gem_xsum_article_DOC_summary_1.json new file mode 100644 index 0000000000000000000000000000000000000000..eb75844a5f6bcd76962aae683ab918de7558b34b --- /dev/null +++ b/4b284b1b9c4seed1/evaluation/generation/slim.4b284b1b9c4seed1_gem_xsum_article_DOC_summary_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.11583572927874138, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.0015868267173138404 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.28673470669230483, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.003637777293225723 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.163100228567693, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.002132266466808726 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.01724716231152785, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0007449366916925016 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.04477737050796163, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.00198811760305303 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.02461427079155061, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.001063162698284129 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.08830410964622547, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0011164040071930121 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.22077364895161825, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.0027438079045214113 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.12465414516933276, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.001518543329628805 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.09327309336629477, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.001264500539576057 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.23298075051437098, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.003053175396768166 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.13165914823095848, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.001722148826191323 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 0.9392811645900702, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.07096662177652757 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b1b9c4seed1/evaluation/generation/slim.4b284b1b9c4seed1_gem_xsum_article_DOC_summary_2.json b/4b284b1b9c4seed1/evaluation/generation/slim.4b284b1b9c4seed1_gem_xsum_article_DOC_summary_2.json new file mode 100644 index 0000000000000000000000000000000000000000..10d958abe702872e7f5a87c06cb5437e61f32052 --- /dev/null +++ b/4b284b1b9c4seed1/evaluation/generation/slim.4b284b1b9c4seed1_gem_xsum_article_DOC_summary_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.11587525551966481, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.0016045754710452714 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.2874887710310145, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.003567488833961318 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.16310151647769613, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.0021173776446693038 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.01786609643978251, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0007624665922748118 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.046073666078135844, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.00202411128686605 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.02540910163910677, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0010850659455729865 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.08869240853211423, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0011665769716760525 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.2219053477816373, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.002750331221052164 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.12516134814219937, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0015660208564047945 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.09346436388002839, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0012938167406065764 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.23423731441915813, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.003085268456864704 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.13195206984139488, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0017467533202419128 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 0.8642738469290718, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.0828969271702355 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b1b9c4seed1/evaluation/generation/slim.4b284b1b9c4seed1_gem_xsum_article_DOC_summary_3.json b/4b284b1b9c4seed1/evaluation/generation/slim.4b284b1b9c4seed1_gem_xsum_article_DOC_summary_3.json new file mode 100644 index 0000000000000000000000000000000000000000..fbe8f2d53902547fb32d4a27f4d7e2172d895a11 --- /dev/null +++ b/4b284b1b9c4seed1/evaluation/generation/slim.4b284b1b9c4seed1_gem_xsum_article_DOC_summary_3.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.11296838065461887, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.0017763597852222038 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.2719068297050645, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.0038490332935536237 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.15604881038304613, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.0022637041314365453 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.01707269817022361, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0007693549928763936 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.042123589858273434, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.0018755138592056807 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.023753467717060665, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0010443537949278742 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.08602111381227089, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.001348786781692891 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.20806883128782105, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.0029718527370379577 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.11872182977619025, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0016793576149961092 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.09123263400217625, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0014417280224893359 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.22083691751530135, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.0031880991373431033 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.12609518726408814, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0018237508130951488 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 0.8836853896564532, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.04539990589714401 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 3, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b1b9c4seed1/evaluation/generation/slim.4b284b1b9c4seed1_gem_xsum_article_DOC_summary_4.json b/4b284b1b9c4seed1/evaluation/generation/slim.4b284b1b9c4seed1_gem_xsum_article_DOC_summary_4.json new file mode 100644 index 0000000000000000000000000000000000000000..d6e2201616425d196e4500d22140d3ee7238488e --- /dev/null +++ b/4b284b1b9c4seed1/evaluation/generation/slim.4b284b1b9c4seed1_gem_xsum_article_DOC_summary_4.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.034882897379201874, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.002246767493274493 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.06473914976317797, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.0037002010817473985 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.04091181078946866, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.0022902327278297046 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.0038285864418821543, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.00040689869864601153 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.009305544911384899, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.0009789224679047535 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.0052797964519696655, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0005471044968877006 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.027308146633009903, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0019083153741966364 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.04967049431208105, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.0028488023843374856 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.03128707048743581, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0017437540939162011 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.028950850747643437, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0019932883821356198 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.05263176539885643, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.003033293906854166 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.03330241832085698, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0018775032498108398 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 0.32264946943694406, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.06831405512505326 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 4, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b1b9c4seed1/evaluation/generation/slim.4b284b1b9c4seed1_gem_xsum_article_DOC_summary_5.json b/4b284b1b9c4seed1/evaluation/generation/slim.4b284b1b9c4seed1_gem_xsum_article_DOC_summary_5.json new file mode 100644 index 0000000000000000000000000000000000000000..f41b190f87fb6646787dfe65a8f4b579902108e7 --- /dev/null +++ b/4b284b1b9c4seed1/evaluation/generation/slim.4b284b1b9c4seed1_gem_xsum_article_DOC_summary_5.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.002234714565312147, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.0006324566810963234 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.0019083246709728258, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.0005363735849273349 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.002011613476498758, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.0005611516641301552 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.000275577641004944, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.00018655929326294164 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.00024871355060034306, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.00018003279128987707 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.00025972087637987314, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.00018245934977293284 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.0017513556534527388, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0005186881670205111 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.0015379808798967414, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.00045866786099632605 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.0015954209721237727, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.00046728726635727905 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.001897742561259706, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0005481199006190125 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.0016448900434096786, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.0004764592460236093 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.0017182753671868714, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0004901161371032653 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 1.7543632002989705e-39, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 1.694640730371467e-33 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 5, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b1b9c4seed1/evaluation/rankeval/4b284b1b9c4seed1_0.csv b/4b284b1b9c4seed1/evaluation/rankeval/4b284b1b9c4seed1_0.csv new file mode 100644 index 0000000000000000000000000000000000000000..7d0847d87a9a27236009bd3bf66a727d04cc2229 --- /dev/null +++ b/4b284b1b9c4seed1/evaluation/rankeval/4b284b1b9c4seed1_0.csv @@ -0,0 +1,21 @@ +task,metric,value,err,version +anli_r1,acc,0.329,0.014865395385928354,0 +anli_r2,acc,0.353,0.015120172605483694,0 +anli_r3,acc,0.3375,0.01365589718546366,0 +arc_challenge,acc,0.22696245733788395,0.012240491536132865,0 +arc_challenge,acc_norm,0.2627986348122867,0.012862523175351333,0 +arc_easy,acc,0.49747474747474746,0.010259652668783474,0 +arc_easy,acc_norm,0.43813131313131315,0.010180937100600078,0 +boolq,acc,0.4923547400611621,0.0087440326197193,1 +cb,acc,0.5,0.06741998624632421,1 +cb,f1,0.24617886178861784,,1 +copa,acc,0.7,0.046056618647183814,0 +hellaswag,acc,0.3990240987851026,0.004886969266944278,0 +hellaswag,acc_norm,0.4960167297351125,0.00498962306877881,0 +piqa,acc,0.6953210010881393,0.010738889044325161,0 +piqa,acc_norm,0.7094668117519043,0.010592765034696536,0 +rte,acc,0.48014440433212996,0.0300727231673172,0 +sciq,acc,0.72,0.014205696104091503,0 +sciq,acc_norm,0.627,0.015300493622922814,0 +storycloze_2016,acc,0.6536611437733832,0.011002874026446419,0 +winogrande,acc,0.5169692186266772,0.014044390401612972,0 diff --git a/4b284b1b9c4seed1/evaluation/rankeval/4b284b1b9c4seed1_0.json b/4b284b1b9c4seed1/evaluation/rankeval/4b284b1b9c4seed1_0.json new file mode 100644 index 0000000000000000000000000000000000000000..719702069bd9711ca913df3ecac68d526eb6b9df --- /dev/null +++ b/4b284b1b9c4seed1/evaluation/rankeval/4b284b1b9c4seed1_0.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.329, + "acc_stderr": 0.014865395385928354 + }, + "anli_r2": { + "acc": 0.353, + "acc_stderr": 0.015120172605483694 + }, + "anli_r3": { + "acc": 0.3375, + "acc_stderr": 0.01365589718546366 + }, + "cb": { + "acc": 0.5, + "acc_stderr": 0.06741998624632421, + "f1": 0.24617886178861784 + }, + "copa": { + "acc": 0.7, + "acc_stderr": 0.046056618647183814 + }, + "hellaswag": { + "acc": 0.3990240987851026, + "acc_stderr": 0.004886969266944278, + "acc_norm": 0.4960167297351125, + "acc_norm_stderr": 0.00498962306877881 + }, + "rte": { + "acc": 0.48014440433212996, + "acc_stderr": 0.0300727231673172 + }, + "winogrande": { + "acc": 0.5169692186266772, + "acc_stderr": 0.014044390401612972 + }, + "storycloze_2016": { + "acc": 0.6536611437733832, + "acc_stderr": 0.011002874026446419 + }, + "boolq": { + "acc": 0.4923547400611621, + "acc_stderr": 0.0087440326197193 + }, + "arc_easy": { + "acc": 0.49747474747474746, + "acc_stderr": 0.010259652668783474, + "acc_norm": 0.43813131313131315, + "acc_norm_stderr": 0.010180937100600078 + }, + "arc_challenge": { + "acc": 0.22696245733788395, + "acc_stderr": 0.012240491536132865, + "acc_norm": 0.2627986348122867, + "acc_norm_stderr": 0.012862523175351333 + }, + "sciq": { + "acc": 0.72, + "acc_stderr": 0.014205696104091503, + "acc_norm": 0.627, + "acc_norm_stderr": 0.015300493622922814 + }, + "piqa": { + "acc": 0.6953210010881393, + "acc_stderr": 0.010738889044325161, + "acc_norm": 0.7094668117519043, + "acc_norm_stderr": 0.010592765034696536 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b1b9c4seed1/evaluation/rankeval/4b284b1b9c4seed1_1.csv b/4b284b1b9c4seed1/evaluation/rankeval/4b284b1b9c4seed1_1.csv new file mode 100644 index 0000000000000000000000000000000000000000..34443c262ca7a6265718e2b0b1f88cc25f9dc4d7 --- /dev/null +++ b/4b284b1b9c4seed1/evaluation/rankeval/4b284b1b9c4seed1_1.csv @@ -0,0 +1,21 @@ +task,metric,value,err,version +anli_r1,acc,0.339,0.014976758771620345,0 +anli_r2,acc,0.329,0.014865395385928364,0 +anli_r3,acc,0.33916666666666667,0.013672343491681822,0 +arc_challenge,acc,0.24658703071672355,0.012595726268790127,0 +arc_challenge,acc_norm,0.26621160409556316,0.012915774781523223,0 +arc_easy,acc,0.49747474747474746,0.010259652668783469,0 +arc_easy,acc_norm,0.4675925925925926,0.010238210368801886,0 +boolq,acc,0.4782874617737003,0.008736805647519946,1 +cb,acc,0.5178571428571429,0.06737697508644647,1 +cb,f1,0.25267737617135205,,1 +copa,acc,0.7,0.046056618647183814,0 +hellaswag,acc,0.4008165704043019,0.0048906236932436216,0 +hellaswag,acc_norm,0.4962158932483569,0.004989638507409917,0 +piqa,acc,0.6953210010881393,0.010738889044325161,0 +piqa,acc_norm,0.7002176278563657,0.01068968696713809,0 +rte,acc,0.44765342960288806,0.02993107036293953,0 +sciq,acc,0.727,0.014095022868717598,0 +sciq,acc_norm,0.68,0.014758652303574874,0 +storycloze_2016,acc,0.6483164083377873,0.011042025772682543,0 +winogrande,acc,0.5185477505919495,0.014042813708888378,0 diff --git a/4b284b1b9c4seed1/evaluation/rankeval/4b284b1b9c4seed1_1.json b/4b284b1b9c4seed1/evaluation/rankeval/4b284b1b9c4seed1_1.json new file mode 100644 index 0000000000000000000000000000000000000000..025ad30b35b51eac3565cf78e4ecbd80f54d0bbc --- /dev/null +++ b/4b284b1b9c4seed1/evaluation/rankeval/4b284b1b9c4seed1_1.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.339, + "acc_stderr": 0.014976758771620345 + }, + "anli_r2": { + "acc": 0.329, + "acc_stderr": 0.014865395385928364 + }, + "anli_r3": { + "acc": 0.33916666666666667, + "acc_stderr": 0.013672343491681822 + }, + "cb": { + "acc": 0.5178571428571429, + "acc_stderr": 0.06737697508644647, + "f1": 0.25267737617135205 + }, + "copa": { + "acc": 0.7, + "acc_stderr": 0.046056618647183814 + }, + "hellaswag": { + "acc": 0.4008165704043019, + "acc_stderr": 0.0048906236932436216, + "acc_norm": 0.4962158932483569, + "acc_norm_stderr": 0.004989638507409917 + }, + "rte": { + "acc": 0.44765342960288806, + "acc_stderr": 0.02993107036293953 + }, + "winogrande": { + "acc": 0.5185477505919495, + "acc_stderr": 0.014042813708888378 + }, + "storycloze_2016": { + "acc": 0.6483164083377873, + "acc_stderr": 0.011042025772682543 + }, + "boolq": { + "acc": 0.4782874617737003, + "acc_stderr": 0.008736805647519946 + }, + "arc_easy": { + "acc": 0.49747474747474746, + "acc_stderr": 0.010259652668783469, + "acc_norm": 0.4675925925925926, + "acc_norm_stderr": 0.010238210368801886 + }, + "arc_challenge": { + "acc": 0.24658703071672355, + "acc_stderr": 0.012595726268790127, + "acc_norm": 0.26621160409556316, + "acc_norm_stderr": 0.012915774781523223 + }, + "sciq": { + "acc": 0.727, + "acc_stderr": 0.014095022868717598, + "acc_norm": 0.68, + "acc_norm_stderr": 0.014758652303574874 + }, + "piqa": { + "acc": 0.6953210010881393, + "acc_stderr": 0.010738889044325161, + "acc_norm": 0.7002176278563657, + "acc_norm_stderr": 0.01068968696713809 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b1b9c4seed1/evaluation/rankeval/4b284b1b9c4seed1_2.csv b/4b284b1b9c4seed1/evaluation/rankeval/4b284b1b9c4seed1_2.csv new file mode 100644 index 0000000000000000000000000000000000000000..2d3935a8dacf3710c667f7977bebf65596dad8bd --- /dev/null +++ b/4b284b1b9c4seed1/evaluation/rankeval/4b284b1b9c4seed1_2.csv @@ -0,0 +1,21 @@ +task,metric,value,err,version +anli_r1,acc,0.33,0.014876872027456734,0 +anli_r2,acc,0.354,0.015129868238451773,0 +anli_r3,acc,0.36583333333333334,0.013910212062701167,0 +arc_challenge,acc,0.25,0.012653835621466646,0 +arc_challenge,acc_norm,0.2645051194539249,0.012889272949313368,0 +arc_easy,acc,0.4936868686868687,0.010258965668044432,0 +arc_easy,acc_norm,0.4722222222222222,0.01024393828588112,0 +boolq,acc,0.4691131498470948,0.00872835350662247,1 +cb,acc,0.48214285714285715,0.0673769750864465,1 +cb,f1,0.2396327951883507,,1 +copa,acc,0.66,0.04760952285695238,0 +hellaswag,acc,0.40021907986456884,0.0048894131262087765,0 +hellaswag,acc_norm,0.4945230033857797,0.0049894820406101124,0 +piqa,acc,0.6974972796517954,0.010717199698083884,0 +piqa,acc_norm,0.7040261153427638,0.010650414317148122,0 +rte,acc,0.48375451263537905,0.030080573208738064,0 +sciq,acc,0.736,0.013946271849440469,0 +sciq,acc_norm,0.687,0.014671272822977886,0 +storycloze_2016,acc,0.6472474612506681,0.011049673577950937,0 +winogrande,acc,0.510655090765588,0.0140492945362904,0 diff --git a/4b284b1b9c4seed1/evaluation/rankeval/4b284b1b9c4seed1_2.json b/4b284b1b9c4seed1/evaluation/rankeval/4b284b1b9c4seed1_2.json new file mode 100644 index 0000000000000000000000000000000000000000..2e99163617c10814f6308381d71d0339f9967b80 --- /dev/null +++ b/4b284b1b9c4seed1/evaluation/rankeval/4b284b1b9c4seed1_2.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.33, + "acc_stderr": 0.014876872027456734 + }, + "anli_r2": { + "acc": 0.354, + "acc_stderr": 0.015129868238451773 + }, + "anli_r3": { + "acc": 0.36583333333333334, + "acc_stderr": 0.013910212062701167 + }, + "cb": { + "acc": 0.48214285714285715, + "acc_stderr": 0.0673769750864465, + "f1": 0.2396327951883507 + }, + "copa": { + "acc": 0.66, + "acc_stderr": 0.04760952285695238 + }, + "hellaswag": { + "acc": 0.40021907986456884, + "acc_stderr": 0.0048894131262087765, + "acc_norm": 0.4945230033857797, + "acc_norm_stderr": 0.0049894820406101124 + }, + "rte": { + "acc": 0.48375451263537905, + "acc_stderr": 0.030080573208738064 + }, + "winogrande": { + "acc": 0.510655090765588, + "acc_stderr": 0.0140492945362904 + }, + "storycloze_2016": { + "acc": 0.6472474612506681, + "acc_stderr": 0.011049673577950937 + }, + "boolq": { + "acc": 0.4691131498470948, + "acc_stderr": 0.00872835350662247 + }, + "arc_easy": { + "acc": 0.4936868686868687, + "acc_stderr": 0.010258965668044432, + "acc_norm": 0.4722222222222222, + "acc_norm_stderr": 0.01024393828588112 + }, + "arc_challenge": { + "acc": 0.25, + "acc_stderr": 0.012653835621466646, + "acc_norm": 0.2645051194539249, + "acc_norm_stderr": 0.012889272949313368 + }, + "sciq": { + "acc": 0.736, + "acc_stderr": 0.013946271849440469, + "acc_norm": 0.687, + "acc_norm_stderr": 0.014671272822977886 + }, + "piqa": { + "acc": 0.6974972796517954, + "acc_stderr": 0.010717199698083884, + "acc_norm": 0.7040261153427638, + "acc_norm_stderr": 0.010650414317148122 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b1b9c4seed1/evaluation/rankeval/4b284b1b9c4seed1_3.csv b/4b284b1b9c4seed1/evaluation/rankeval/4b284b1b9c4seed1_3.csv new file mode 100644 index 0000000000000000000000000000000000000000..8e5c5e6da3d2bfba333906723f60e303e6606697 --- /dev/null +++ b/4b284b1b9c4seed1/evaluation/rankeval/4b284b1b9c4seed1_3.csv @@ -0,0 +1,21 @@ +task,metric,value,err,version +anli_r1,acc,0.337,0.014955087918653586,0 +anli_r2,acc,0.369,0.015266698139154619,0 +anli_r3,acc,0.3541666666666667,0.013811933499570956,0 +arc_challenge,acc,0.24488054607508533,0.012566273985131354,0 +arc_challenge,acc_norm,0.2619453924914676,0.012849054826858117,0 +arc_easy,acc,0.4970538720538721,0.010259605416237575,0 +arc_easy,acc_norm,0.4730639730639731,0.010244884740620087,0 +boolq,acc,0.4712538226299694,0.00873059018871715,1 +cb,acc,0.4642857142857143,0.0672477765493766,1 +cb,f1,0.2330246913580247,,1 +copa,acc,0.71,0.045604802157206845,0 +hellaswag,acc,0.39603664608643696,0.004880726787988637,0 +hellaswag,acc_norm,0.49422425811591314,0.004989448490164425,0 +piqa,acc,0.6926006528835691,0.01076560250693907,0 +piqa,acc_norm,0.6991294885745375,0.010700745724145973,0 +rte,acc,0.48375451263537905,0.030080573208738064,0 +sciq,acc,0.742,0.013842963108656603,0 +sciq,acc_norm,0.694,0.014580006055436969,0 +storycloze_2016,acc,0.6611437733832175,0.010945481921408545,0 +winogrande,acc,0.5146014206787688,0.014046492383275835,0 diff --git a/4b284b1b9c4seed1/evaluation/rankeval/4b284b1b9c4seed1_3.json b/4b284b1b9c4seed1/evaluation/rankeval/4b284b1b9c4seed1_3.json new file mode 100644 index 0000000000000000000000000000000000000000..08c7e9738decbf84cbec41f865073e8d8c065f09 --- /dev/null +++ b/4b284b1b9c4seed1/evaluation/rankeval/4b284b1b9c4seed1_3.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.337, + "acc_stderr": 0.014955087918653586 + }, + "anli_r2": { + "acc": 0.369, + "acc_stderr": 0.015266698139154619 + }, + "anli_r3": { + "acc": 0.3541666666666667, + "acc_stderr": 0.013811933499570956 + }, + "cb": { + "acc": 0.4642857142857143, + "acc_stderr": 0.0672477765493766, + "f1": 0.2330246913580247 + }, + "copa": { + "acc": 0.71, + "acc_stderr": 0.045604802157206845 + }, + "hellaswag": { + "acc": 0.39603664608643696, + "acc_stderr": 0.004880726787988637, + "acc_norm": 0.49422425811591314, + "acc_norm_stderr": 0.004989448490164425 + }, + "rte": { + "acc": 0.48375451263537905, + "acc_stderr": 0.030080573208738064 + }, + "winogrande": { + "acc": 0.5146014206787688, + "acc_stderr": 0.014046492383275835 + }, + "storycloze_2016": { + "acc": 0.6611437733832175, + "acc_stderr": 0.010945481921408545 + }, + "boolq": { + "acc": 0.4712538226299694, + "acc_stderr": 0.00873059018871715 + }, + "arc_easy": { + "acc": 0.4970538720538721, + "acc_stderr": 0.010259605416237575, + "acc_norm": 0.4730639730639731, + "acc_norm_stderr": 0.010244884740620087 + }, + "arc_challenge": { + "acc": 0.24488054607508533, + "acc_stderr": 0.012566273985131354, + "acc_norm": 0.2619453924914676, + "acc_norm_stderr": 0.012849054826858117 + }, + "sciq": { + "acc": 0.742, + "acc_stderr": 0.013842963108656603, + "acc_norm": 0.694, + "acc_norm_stderr": 0.014580006055436969 + }, + "piqa": { + "acc": 0.6926006528835691, + "acc_stderr": 0.01076560250693907, + "acc_norm": 0.6991294885745375, + "acc_norm_stderr": 0.010700745724145973 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b1b9c4seed1/evaluation/rankeval/4b284b1b9c4seed1_4.csv b/4b284b1b9c4seed1/evaluation/rankeval/4b284b1b9c4seed1_4.csv new file mode 100644 index 0000000000000000000000000000000000000000..6dc49ce399756e846d2c08dab463e17f917895cf --- /dev/null +++ b/4b284b1b9c4seed1/evaluation/rankeval/4b284b1b9c4seed1_4.csv @@ -0,0 +1,21 @@ +task,metric,value,err,version +anli_r1,acc,0.336,0.014944140233795025,0 +anli_r2,acc,0.339,0.014976758771620347,0 +anli_r3,acc,0.33916666666666667,0.01367234349168182,0 +arc_challenge,acc,0.25853242320819114,0.012794553754288677,0 +arc_challenge,acc_norm,0.2619453924914676,0.012849054826858115,0 +arc_easy,acc,0.502104377104377,0.010259692651537032,0 +arc_easy,acc_norm,0.4684343434343434,0.010239317603199499,0 +boolq,acc,0.4804281345565749,0.008738352682962235,1 +cb,acc,0.48214285714285715,0.0673769750864465,1 +cb,f1,0.2423076923076923,,1 +copa,acc,0.64,0.04824181513244218,0 +hellaswag,acc,0.39563831905994823,0.004879880092103959,0 +hellaswag,acc_norm,0.4970125473013344,0.0049896923443139935,0 +piqa,acc,0.6898803046789989,0.010791876566843054,0 +piqa,acc_norm,0.7007616974972797,0.010684130673134581,0 +rte,acc,0.4729241877256318,0.030052303463143706,0 +sciq,acc,0.753,0.013644675781314128,0 +sciq,acc_norm,0.7,0.014498627873361425,0 +storycloze_2016,acc,0.6531266702298236,0.011006857922124124,0 +winogrande,acc,0.5201262825572218,0.014041096664344329,0 diff --git a/4b284b1b9c4seed1/evaluation/rankeval/4b284b1b9c4seed1_4.json b/4b284b1b9c4seed1/evaluation/rankeval/4b284b1b9c4seed1_4.json new file mode 100644 index 0000000000000000000000000000000000000000..496356f261ea29f8491299fa229264f01fae402c --- /dev/null +++ b/4b284b1b9c4seed1/evaluation/rankeval/4b284b1b9c4seed1_4.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.336, + "acc_stderr": 0.014944140233795025 + }, + "anli_r2": { + "acc": 0.339, + "acc_stderr": 0.014976758771620347 + }, + "anli_r3": { + "acc": 0.33916666666666667, + "acc_stderr": 0.01367234349168182 + }, + "cb": { + "acc": 0.48214285714285715, + "acc_stderr": 0.0673769750864465, + "f1": 0.2423076923076923 + }, + "copa": { + "acc": 0.64, + "acc_stderr": 0.04824181513244218 + }, + "hellaswag": { + "acc": 0.39563831905994823, + "acc_stderr": 0.004879880092103959, + "acc_norm": 0.4970125473013344, + "acc_norm_stderr": 0.0049896923443139935 + }, + "rte": { + "acc": 0.4729241877256318, + "acc_stderr": 0.030052303463143706 + }, + "winogrande": { + "acc": 0.5201262825572218, + "acc_stderr": 0.014041096664344329 + }, + "storycloze_2016": { + "acc": 0.6531266702298236, + "acc_stderr": 0.011006857922124124 + }, + "boolq": { + "acc": 0.4804281345565749, + "acc_stderr": 0.008738352682962235 + }, + "arc_easy": { + "acc": 0.502104377104377, + "acc_stderr": 0.010259692651537032, + "acc_norm": 0.4684343434343434, + "acc_norm_stderr": 0.010239317603199499 + }, + "arc_challenge": { + "acc": 0.25853242320819114, + "acc_stderr": 0.012794553754288677, + "acc_norm": 0.2619453924914676, + "acc_norm_stderr": 0.012849054826858115 + }, + "sciq": { + "acc": 0.753, + "acc_stderr": 0.013644675781314128, + "acc_norm": 0.7, + "acc_norm_stderr": 0.014498627873361425 + }, + "piqa": { + "acc": 0.6898803046789989, + "acc_stderr": 0.010791876566843054, + "acc_norm": 0.7007616974972797, + "acc_norm_stderr": 0.010684130673134581 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b1b9c4seed1/evaluation/rankeval/4b284b1b9c4seed1_5.csv b/4b284b1b9c4seed1/evaluation/rankeval/4b284b1b9c4seed1_5.csv new file mode 100644 index 0000000000000000000000000000000000000000..8057e400046b01744c52c5b7627425b1c49408d0 --- /dev/null +++ b/4b284b1b9c4seed1/evaluation/rankeval/4b284b1b9c4seed1_5.csv @@ -0,0 +1,21 @@ +task,metric,value,err,version +anli_r1,acc,0.349,0.015080663991563102,0 +anli_r2,acc,0.345,0.015039986742055237,0 +anli_r3,acc,0.345,0.013728421539454872,0 +arc_challenge,acc,0.2593856655290102,0.012808273573927095,0 +arc_challenge,acc_norm,0.27047781569965873,0.012980954547659556,0 +arc_easy,acc,0.4970538720538721,0.010259605416237575,0 +arc_easy,acc_norm,0.4772727272727273,0.010249179090605976,0 +boolq,acc,0.47003058103975537,0.008729331818314898,1 +cb,acc,0.5,0.06741998624632421,1 +cb,f1,0.26879199874980464,,1 +copa,acc,0.62,0.04878317312145633,0 +hellaswag,acc,0.40001991635132444,0.004889007921214693,0 +hellaswag,acc_norm,0.4993029277036447,0.00498977656227611,0 +piqa,acc,0.691512513601741,0.010776164678037159,0 +piqa,acc_norm,0.6985854189336235,0.01070624824275376,0 +rte,acc,0.5018050541516246,0.030096267148976626,0 +sciq,acc,0.754,0.013626065817750633,0 +sciq,acc_norm,0.711,0.014341711358296181,0 +storycloze_2016,acc,0.6547300908605024,0.010994860223187677,0 +winogrande,acc,0.5185477505919495,0.014042813708888378,0 diff --git a/4b284b1b9c4seed1/evaluation/rankeval/4b284b1b9c4seed1_5.json b/4b284b1b9c4seed1/evaluation/rankeval/4b284b1b9c4seed1_5.json new file mode 100644 index 0000000000000000000000000000000000000000..9ba61de394f44d68f45f4766f73476c23e154d14 --- /dev/null +++ b/4b284b1b9c4seed1/evaluation/rankeval/4b284b1b9c4seed1_5.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.349, + "acc_stderr": 0.015080663991563102 + }, + "anli_r2": { + "acc": 0.345, + "acc_stderr": 0.015039986742055237 + }, + "anli_r3": { + "acc": 0.345, + "acc_stderr": 0.013728421539454872 + }, + "cb": { + "acc": 0.5, + "acc_stderr": 0.06741998624632421, + "f1": 0.26879199874980464 + }, + "copa": { + "acc": 0.62, + "acc_stderr": 0.04878317312145633 + }, + "hellaswag": { + "acc": 0.40001991635132444, + "acc_stderr": 0.004889007921214693, + "acc_norm": 0.4993029277036447, + "acc_norm_stderr": 0.00498977656227611 + }, + "rte": { + "acc": 0.5018050541516246, + "acc_stderr": 0.030096267148976626 + }, + "winogrande": { + "acc": 0.5185477505919495, + "acc_stderr": 0.014042813708888378 + }, + "storycloze_2016": { + "acc": 0.6547300908605024, + "acc_stderr": 0.010994860223187677 + }, + "boolq": { + "acc": 0.47003058103975537, + "acc_stderr": 0.008729331818314898 + }, + "arc_easy": { + "acc": 0.4970538720538721, + "acc_stderr": 0.010259605416237575, + "acc_norm": 0.4772727272727273, + "acc_norm_stderr": 0.010249179090605976 + }, + "arc_challenge": { + "acc": 0.2593856655290102, + "acc_stderr": 0.012808273573927095, + "acc_norm": 0.27047781569965873, + "acc_norm_stderr": 0.012980954547659556 + }, + "sciq": { + "acc": 0.754, + "acc_stderr": 0.013626065817750633, + "acc_norm": 0.711, + "acc_norm_stderr": 0.014341711358296181 + }, + "piqa": { + "acc": 0.691512513601741, + "acc_stderr": 0.010776164678037159, + "acc_norm": 0.6985854189336235, + "acc_norm_stderr": 0.01070624824275376 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8e084d8763e294958a88d5e0ebcaa13b379ca679 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0619ab97543c2640642db60edcb0acf5dd4ae82e718cb7d437b2f8e056bc5f2c +size 199058647 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_0_mp_rank_01_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_0_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..24c67464780e8f5665032ac7792a69605c144f70 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_0_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:be8d0d3e76a3bd814a72efce2097158d0a9a439da97f0f39d81a3c2e6c131c2e +size 199058647 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..60cc4e9ba0c1dfaa2a69ebc10e1e4c3047310def --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97d55fcd247f99f387586daf1527b5ebee404a771157305c5f4969a01ff06bc7 +size 199058733 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_100_mp_rank_01_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_100_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7e3cd8a9ca5bf8ffeb9a6b5e8920f1e3ede520f6 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_100_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c9f1523ff04ae211bc3304a4e8ee13a1214c6d09d815701d7885721833264f46 +size 199058733 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9676aabaab68acd07170af8e72f634bd16ebe12f --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:92c5c6124a63decb02e70e363b0b4f0decf2892fa69507e4c32c332a4459e563 +size 199058797 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_101_mp_rank_01_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_101_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4244b4228b0d64aea95ed0762852f3fb5e027a2f --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_101_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5acac8cb46e80fd916a34e4b5928110be34f8a663d586f417ede28e673458470 +size 199058797 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bccfb762daac340173f29d4f5912bd8bfbd5e474 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:63361991baf1706c7b6a61a7e1fffd495caa75c4aa262e3c87b2264de3f202b7 +size 199058733 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_102_mp_rank_01_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_102_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4209d15ff4507ff3b3a2512cd69c5ba18bede280 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_102_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0946f8ff31f91218940297babf5e42e50995a6950de6172bb6afa572ee0ccada +size 199058733 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0f3c094a484b3495b91b41babca1c5f002335be8 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dd231965025781ed0ede4d5d9c54494a2e3da8d91e2aa189c3ea34cb4a65ac8d +size 199058733 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_103_mp_rank_01_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_103_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ad6c6ae742456a4196bd75b8927967dd9c74b494 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_103_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:74f6094ea840a0e8ea7a8a5d09f973fb72e83651f9b3cf04b11360b41e94b499 +size 199058733 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6db844d090f190951c04d03284fcc3217acdd627 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:261f3efbfb6a66a4780ab83c99ef09518795d38daf10b05fee321cc9d3901819 +size 199058797 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_104_mp_rank_01_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_104_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..06ae5d0c4e9847c96be6c7823a4908b2848f25f8 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_104_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5d9d35d09cf18a96098d01fc732402fe204deeb370e5252e5c36f613ddb48c13 +size 199058797 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..359d9ca0315af4bd8bf74966ea7720c2fbf02b7c --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:83e0957320a34fbd0e99a12ca4577030765247a474b19b0395cdbdfb05bc0808 +size 199058733 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_105_mp_rank_01_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_105_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4ebee26b0939b523617757d0837ed18a94d752c6 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_105_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cafe14cb5c1ceea9634b35110e208b32fe49001d3fdc111cf2ded48340a1d9f5 +size 199058733 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cb3593cf10595313836a84e38163d2bf9a2c5081 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e0406017b25a04864d53bddfc0e219221c827652fbce4417ceba307dac97a3c4 +size 199058669 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_106_mp_rank_01_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_106_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b5d9a4d313f15cc869116677e0c2c3a91c081f8a --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_106_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b4e24e43dd5fc06ab753893e7c4babc68651e1557d1d0aec63fc1988c67cb40a +size 199058669 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d911ac06b2cdb8f3de6b5e5ed6225c801397c6e8 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d3d5e818f45a483fa71650dc0e449ba21e9a148b104ec1f9bc16e37c639ba64f +size 199058797 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_107_mp_rank_01_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_107_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7f5a2e2f63eb45e55782d285080e944f6a1a4ffb --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_107_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0f2a96c2687487619231af685e4ccc4c14a2d8d6152a8be81a52d96a3bf4cecc +size 199058797 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e6ec4bc0324334251afa0be664f5402e8d7c6741 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:197f0abd843afa1e9f62a2e543175ae3de8eee503e9d9708632c15f3b55d48ac +size 199058733 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_108_mp_rank_01_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_108_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..691a814eecb10aaa1fbf024d35df11958f3927c1 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_108_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:37968c3957ae70840b0f79995fc3a12ab0ab808db3fca12cacd5995e40fcbc32 +size 199058733 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c522fe668542efa0fd2fbf20494243cef7303099 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9a553297d9a069f5f08352d3ee671237e9df5105e5ed69d030a4a1407be12b9c +size 199058733 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_109_mp_rank_01_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_109_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9ae6c9a9d44205bc0dc45910d9a79fa5941c9935 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_109_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:121f0c6664a7fb3d721ba6f1c0d4203d785482a63f4ec78c9371a7881f33b310 +size 199058733 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2880b3ca5c9031a9be76641e4afa80bfde7fe090 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6743766fcafaf6caf53fb0a6955d71fa3cbdf1498beba3e1ec7bf8bde2b4de83 +size 199058658 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_10_mp_rank_01_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_10_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..10ede5bfa6fc6e474ea1cef48ce51b38ed4f8369 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_10_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:828990050f4e27dd37807fc2a74ccf23ea825e13c9768dcc240062c1e3d5aafd +size 199058658 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..25219a3c7aa62f70fb9258414022251f8aae5361 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97ba970019cc52630422399d85f5c80955bb2e55600baf9535ff5d697eec0e48 +size 199058733 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_110_mp_rank_01_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_110_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bf4378970caf60675db53c4bb7c1495ed01e1a15 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_110_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba5971095ea6ab137db76e1272477b9267f6148c0214621bc7fa4ae329c15ad4 +size 199058733 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fe2e33473a95963de82b0260c770dcfba44f2752 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5ffc25c5479ce968c71aebe166189983c4020c244a04660210b7ff90a74f5960 +size 199058797 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_111_mp_rank_01_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_111_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..28862144b6318be563f03bebbb99530255fbe9ea --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_111_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae46ebbf828f10f496fefefdaf2bbf5e16848c52ce36d01fc39e4b8b49aef990 +size 199058797 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..422b7fe43d93621d0ffb9dbfe5101c8410b45ccd --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:99330c4ee2e29e79beefcca701be18a9af2ff671e9c59bfcb74efbb842082029 +size 199058605 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_112_mp_rank_01_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_112_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c45df1b88c05a4367b44fbcb5e5adfaf4811c566 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_112_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5b23b88d12a593559298bf26a6824e70edbd55826abc41cb29f91f16a087bbfe +size 199058605 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1d500c4317f697f2caef31ba311da21ff0818d32 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0728b5233734aa45840eae4842efb2373b4a28702067231046584ce782b36dd7 +size 199058669 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_113_mp_rank_01_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_113_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..222484eb1a1b99575d2b829dc69a1276f8d58e82 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_113_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8549b59bfef859906f05ce15d6da68e5dfe2af1bce781c31a474b2b42f9b3069 +size 199058669 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..378adb317f3deae6f2e576995267506ac9c3c753 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0e5181b21136d1714c46e7465a93fa53b5712e805e19ec09b4d221bd1291159c +size 199058797 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_114_mp_rank_01_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_114_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f779acd40e9ca5c5a9ef5eb894e123e53b534093 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_114_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:47520ce7d20430310457a807ff70de23d1048c0d57423ecda20c536ed88ad126 +size 199058797 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dee65407acbab6be05604beeae66a7b4b132dd0c --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9f8f9760d909ff48d248a37502b191c0cf2e24638fcf7c920fdbe09dafcdb0b2 +size 199058733 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_115_mp_rank_01_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_115_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b2a69c6555bf0be73422e69be29cd8972c84c79e --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_115_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:100108258c5578bdb63904e3e1649efa22ca4c6c89e951a4dac7fe3d5c404706 +size 199058733 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..604784b96840138d2f6d578a78389fdda2537cd4 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7d5eec7571713c6134016b76b0b8750e6c1cfe97961f3ca8f82a6780cbd1cdf5 +size 199058733 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_116_mp_rank_01_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_116_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5896104cf4cd44a823bc86baca837fde6d23b28a --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_116_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2143e9bce7eba177df71ec436a6fad3729680c32ff03a3339c19500178014b4b +size 199058733 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..022e9dbaea214a4c3d2c67e01942f7b6db719bf1 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e2f96f55a61da615ed796b12036fd3a4ee1a16cf7d11dfce26cdeab6224f2bf +size 199058733 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_117_mp_rank_01_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_117_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9cac6d2899f20eccbbab63a1b6b00a9e6ff0aaac --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_117_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd0306459ae26026a6a9436e0e63848d3266f330c25800f17726379021f314a5 +size 199058733 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a85711f8793778fa74bca58628050281c344de5a --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0f6b562c6f801cc35b36e1ddd2bf5e59d3723b3dc7a64ec709f9b9ddaabdc0f4 +size 199058797 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_118_mp_rank_01_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_118_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5c0a770792e74c49a6701714abda02aae8a0de80 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_118_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cffcbfe78b9081df1e5f45014984b0a6763c8433f8f4af6a8730c17180958e4a +size 199058797 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2e48b448a722a03cb854f7ea5b7baad80197241b --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8afb37bf67b67a89c77fc41c28f946d0d94eeb82640c4690a4568e1d22e42ea2 +size 199058669 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_119_mp_rank_01_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_119_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2a38745eae7d87baef540c77e522047a438f8cf7 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_119_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee4993757e643f56dc054b1a04293623a1247834f1673b28441a5ecd250e112f +size 199058669 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..de53d55447b68d99e06d9183cbe4d02e90271383 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aec5db8933577ffb763868eb7c65d280c983bf8d6ba167ed74eee20d5e518551 +size 199058850 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_11_mp_rank_01_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_11_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..28799165f16ee2a5bc2ce1b5489f0d261238d1c8 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_11_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:881d255f59d15120946ba30244529e3eda8756badf9a83ada446248154307ab9 +size 199058850 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fde4b1cb1f287ccad60e468f84b58560262f02db --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:52618a31d4add766701f88f2ffd4f3f97b11dc0625f1041dc104c1ca82c14111 +size 199058669 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_120_mp_rank_01_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_120_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3fe1c57564304801c61546149d13eb6ff2634221 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_120_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a4a7f4c726e09b197a808ebccd156b4cf985a8bfe3dfb716a449943f548f320b +size 199058669 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d1dca8c83402ba447be8d2912084adfd81eb2ea6 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:425fda68e851ccaa901da1762d6bbe70c3d693332858ef5fde06ac163eb965de +size 199058797 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_121_mp_rank_01_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_121_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e160457370266fa6d0a639e6b4e78785cba35edb --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_121_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:28f858e4703039c1086fe6278ffe0ed623b0f3b36c989a0982315439a47add13 +size 199058797 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..82b0530503f83f392a62f3acfffad422b69124c0 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c6bd6a80c93f6b354a1daf3ef0c2740b8ccaa4e509859022a52a08c3b5253aba +size 199058733 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_122_mp_rank_01_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_122_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3bec55391c1e60917ee0e881ce54a1f938991c0a --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_122_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e5fe09b3b1408967858f4dea8a981fe22e1c6be5236777514dcaf548631b6550 +size 199058733 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9d3a10ead92404915821cb3cbb4c19b683ee4cf9 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:423a2ba748ea716f9a7df81f285c4cf6982e57c18a7756146c8de095eb0e0814 +size 199058733 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_123_mp_rank_01_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_123_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bbd468c8c57b9441565f8b5af69753ee1327e7ad --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_123_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97d7ceb0927b2a79f06e20d698fade1d7bf1cbd920a6d23b24b0312e18b7e650 +size 199058733 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bf844c0cdc0012bb169b2ba99c781291265658c3 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b1c66695b07dec787b637634714406e84293eaa70db77c4ccd58892576ec86e +size 199058669 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_124_mp_rank_01_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_124_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..346ad890a6bd3dcf972047438995bb0deaad3a29 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_124_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2d1356e22763c017cea4640e09db8d9911c70a9e39f269ca12701bd7d2b67ee7 +size 199058669 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6a179ecd2733c0767dcf5d112c34dbdf0555a120 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5b59d0957d4124e7b03ff15a89a056430f42e3012d07616ca33f599016b8398b +size 199058925 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_125_mp_rank_01_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_125_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d24093dac8f73dd1a6b4c58f4d6684bda529a9f3 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_125_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:06d29c2ecf5c6f5660141106af815122ef0fba512d30cc213d291a970a6caf54 +size 199058925 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..de025a0eab17565248b1c625097a4b6bde981f7c --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3c899635e6cc0e350d18349adb612670f99aed3ad20af48dea715cf449ad01be +size 199058605 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_126_mp_rank_01_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_126_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..544b581ab3e811e26f65db0a23b81cbcfb41444f --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_126_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f307a939631f3f969c4a6dd0ed2451e26d49777fe90d7984c872f6dcca73249e +size 199058605 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fa23275f84b0c5d287b31db9f441ed86455dab08 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:39cfd3a72d73eeec7cddb40e8a752427e1faa85d7cc998092bedc66ab40423b7 +size 199058605 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_127_mp_rank_01_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_127_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f332c1af65a764908f65b012e5fbc9fc4876c696 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_127_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:48910b8e4e0066a79eb81ffe89624bc1e0400a61392e61b3cdba21ffd710b6e7 +size 199058605 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..07923ac81f5cd59f86618c627e91949205eb87d1 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:07e238723c51eba5c6ecedd0c8ed6830f4d3724d31e4dc42720443c90dcbaf03 +size 199058722 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_12_mp_rank_01_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_12_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..189e857966b5042b667e53597590ecf4bfb9b20c --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_12_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:516f61afd7c0a6d9abcdd2c5d4276e8f45868b240d269681d049ef1c945d2796 +size 199058722 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..670592f6160abdde3d6d584cf2fe8cf396a19aa3 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9727b04563550f337a61e8c6eadebe3b7dcbbf01addf7d2cdfce7c235edb81b3 +size 199058658 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_13_mp_rank_01_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_13_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4ea635f4aaf05264a98bceea7d68e61e0f6072e8 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_13_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:801e5cc01de69264a45333f38097f06ccf98f1062fb09739354802d46c75decf +size 199058658 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..eb75dfeed6d65d49389d9d93f9f704b53c08de93 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:638f23b1ed89be006f5f1799cf7407a9e74648d6ac0aeca4cb3c7e8aaf9c008d +size 199058722 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_14_mp_rank_01_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_14_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a42cdac4f860e74bb2c4977765e35ecace4c5ab4 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_14_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da1a04e4082cde40a02491844bfe1e4f8d9f313f8c4915e5886d2bf2d6e57cc1 +size 199058722 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6b9daf461162c0d28bc85c1fcd418c481619f810 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4159d3a389ad6e4d2aced3d6b15b2cdb3309ebdeaa0f9649c38508904df6b8e5 +size 199058658 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_15_mp_rank_01_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_15_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2a2a8cc3bece82b763f84965ed77a8cd9cea597b --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_15_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1726a781c283105bac07a36370b66f3daa375312e734fa89e1545c36dc269fd5 +size 199058658 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f71d2ff525c8de4ff8473517d1d2a59ff5389cb0 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3c7ae9ad16361a89eefe3e9da1648a777d98284c073d0928fff2dad0fd1ef236 +size 199058786 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_16_mp_rank_01_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_16_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..def969dd27f742a53a2085c1ff9cfe12b2af5d90 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_16_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d15071e581bd1021058fa95f3aad75e1c6a164eab67bf0ac788995167e14ac10 +size 199058786 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e57752094c74546e2aab3442d0374315e8c66b1a --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7f48c3bcfb33c9abc3576e83d13d074f35e598cdf47abc3268a0cc0584f0a813 +size 199058658 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_17_mp_rank_01_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_17_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e6207c854e25d64c423fd4c6236f0b8a84175d35 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_17_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f57d0be00cf3a3416c1a1244642683712d59cd3ce8e2a5021f68636ec3630c7a +size 199058658 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..632d3a8cce11d2e34da8240223501d74c2d668cf --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:afa26d8061128ae0b919a7c3da4ac4aca58712ab7651f92c27436b88bebe51db +size 199058978 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_18_mp_rank_01_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_18_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..635992894368f2e7d85cea864b6eb351eba1f97b --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_18_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8026c3f4890828a083898aba91d42dfb79cc6091f2f21102f3d2c76348d3594f +size 199058978 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a583752d0c86272aca633cf332a080d89839a5f6 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c37b0c51b0e349f34f898e87a4820515a7e76cba6e8b871ef0d133ec11d77db0 +size 199058658 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_19_mp_rank_01_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_19_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..43808e13a971260268624a2f0ebede95a9920d99 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_19_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7d9526bc3d38b231006aeaf83ac705f60dda5143463330257cd882a895bce1d3 +size 199058658 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b45e9ebc7681235b25f9cb3ea30e64eb7becf062 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cbd6e70761829266696dfc8ce846fdfa71cd98107d8b5826ed2f4dfab74c0f69 +size 199058647 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_1_mp_rank_01_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_1_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9df2fbf8a862c12ec981e1af7dec7f367b4a8acf --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_1_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c446650fdf6b9a7a8c411c349a53505ecdf3fcbd1e01996ed0adb3d8c780acf7 +size 199058647 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ef9fc515500027e0e9778705bde78aa95d9a8714 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a5283adc263fb978a476928bff76cfbc66778b0f004fd416cfdc191896c15fa8 +size 199058658 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_20_mp_rank_01_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_20_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d618670b026d432885cfad71c582d48dc4d69825 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_20_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:524692cd77771b6744f3be6efff083e04cbda1aa1a64d689b4ef90d00628fa19 +size 199058658 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4412bf5625d08e9bb402fef803fa4bbd62ad3173 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7901217b59e299ae625feba8d619630b0f4f5a5bd02895cf9290ad9ad2ffdf6d +size 199058722 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_21_mp_rank_01_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_21_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..40ecb21d033d7b3b05ffdb0abe505f524acb7a1c --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_21_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:327b94ed22e09340d186cacffcd6a244a0a7df7445e2fa1ab3d0e8f3c7484717 +size 199058722 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fe1f754404fde359bdc5f88c37df4841ea66edb7 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c6096eeb7b91ba826b1e651a3b6b3b19546a473847fbf4d34ad38c030cb41c78 +size 199058658 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_22_mp_rank_01_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_22_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d181ab8eac26f7786aa58c5c0942f8cc3eb78866 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_22_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:68cdd42ecc59da12d2538db79d219d117f5d14591c0c88a1ab8ed40e5245c416 +size 199058658 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b0c2e854e15e64d9dc537d20f93641ab66c2609e --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b27ca99f30a02548b647cfa612c379de1a655ea2d10aab7ef00aefaa167691be +size 199058786 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_23_mp_rank_01_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_23_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d677f0538dd4c0a2663dda511abaa14b15e67c47 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_23_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c489b337add6797a66fe5863df046ff28b301c6cc78663440270d3f3e84aaf23 +size 199058786 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d42f395fd3bd752cf218a7e893f8ab01f0b68dde --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a7a571411c74fb9cb53bfbb649a6fc195fdcb6c162491b93efe9469303e18153 +size 199058722 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_24_mp_rank_01_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_24_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..571dd70c8d41b221e5342eb06bbf1f633ea2ea1f --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_24_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e57d96c346ca27e0a6ff2ecf16b2533e29cf6aa8e1be5b1d21580ce7831f8af +size 199058722 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3c66cd6bf6fc585f442d9d4c2389ff261936e34b --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1a000a36e07f187024ca780666fc7bf733eed04841f24b9e664b7d5889715ef8 +size 199058850 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_25_mp_rank_01_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_25_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..445032a69ce404680fc7ab529b55d9c0977e3c14 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_25_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e9447dc0202e11ecec51e4e2c3c868321439205caf53a3eebefc4d07892fa2fe +size 199058850 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b60b4b2386acb9d864e57e6e7e13d04a652f38cd --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:194debf47e61b049f6ca2dc100244ef7c6170591bac9391a058e85893be9b3a5 +size 199058722 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_26_mp_rank_01_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_26_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dc841de7133778ab93abba5b43fab4dcdfbbd30a --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_26_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7f5788b1fb73e325e1f1ecdfee3a0ca27825594175e4c54e2c76c6a7a4e71d1e +size 199058722 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7cf96810adafa14f62753644ad125beb77be02d3 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4193e9c49f8d712588b539f23ce1bc3304dca384a7c09be06045b796b1063977 +size 199058722 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_27_mp_rank_01_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_27_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..99aa03a9d52915efb66b72acb7704a9b63bf06a5 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_27_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f2ad62d38bcf57d239094fddf3b160daae616d10b76a3a8b15fd8d99fb391be4 +size 199058722 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..306581cf64d94c8e86d241dc3f6e4cde760967b9 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b7491f66cfae443b36edf98e0360772b25a2c9d47a2cd7aa1a0b1e3bb2c57323 +size 199058594 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_28_mp_rank_01_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_28_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..84994f16afb6fa75ca81b11b4362669d6141a63a --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_28_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3140e6a0a78b0e584e7e29ad51629df3c08acef7b6904081b72eae725a691aa7 +size 199058594 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..37ed1265b5c5f9c1db5a3e19f0c7d15df71efe26 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c89cfdb19fe92bc9e89755fc39df97c0968e6c5b52bad614d91129b971309cd8 +size 199058786 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_29_mp_rank_01_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_29_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f8044646b736a833f6a45b35e385cb13f5ed16b2 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_29_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:38717814562a1df0f5ef43b03986ae8c79362780748a80b00d1ed7e65f493fe5 +size 199058786 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6cf2df437b7cdae9a7e9c74075c1ffa359a9f2a8 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b9332f5e50539f9368015f06e97a7db8dd50a853c816ede4381cb7e6445cd37a +size 199058711 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_2_mp_rank_01_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_2_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b046b1319edd32b92cc74de4b070d507e4c08eda --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_2_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:24a6eb128b72e77f1ce934e263760712eef0a3202d34de63293305207426eb59 +size 199058711 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b4f188a4acfa4b6084a7a0b092c4ffb0a48585b8 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a0a7c1b728de32b50550b5ba7824006c9fc72379ceb6d5ee1e3a9c29d910c2e4 +size 199058722 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_30_mp_rank_01_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_30_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..df9d726d5882d95377881f2a9fd8f77e4209b00a --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_30_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b9edd14057990e6470325114f8920666e66491dbcf5becc802932ff16c806666 +size 199058722 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f98dca59cf59e957e69d41c2537a4000b972f1eb --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6bdf5f47f63082f966559c5b12147ac724afdd3f30eb2a3022ef2c664ce47bf5 +size 199058722 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_31_mp_rank_01_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_31_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3164030b45828b370f53ef085c26bacd83b8b755 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_31_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:329c4869a2da6e1b64077fafbe54921b17aa77e1135f27b8c34282c0a0005701 +size 199058722 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5aa2e7e53213c1d7c29346ed1c45e8d850d9cde7 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c9cf066b6d4c7534e4d18c8169e13f75a121ed62b6050cc11062b1065e27fa5f +size 199058722 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_32_mp_rank_01_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_32_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3b9857eaffdb7a98f69397fe0f307f2d41eef439 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_32_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a4924e5c4968780d0b400a662c13e72c80443d93ddb3caffa512df96a3972eb6 +size 199058722 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bae93c15c99e740dc355880b383b9858dd7e5676 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7fb637b022f741d2be29d3156f8cedb205358857c03176b3495b0e8a6788c231 +size 199058722 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_33_mp_rank_01_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_33_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c02428ac352084ab338a0b157d6758d8d30d5094 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_33_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3c87b65754900fe47bd1c07a3a9266656d0246605de8fb4285cf9a5a18260d12 +size 199058722 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..019074f5a587187fac6d4a487bfac37dad0a6978 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e6a04d25ddf52fa866a07df3d46ef2858b6823a9a8d113102b4af3e57ce92e74 +size 199058722 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_34_mp_rank_01_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_34_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d44596d644d6f9a19411ddb0f156f9530366217b --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_34_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:653c19a1c8ce574bddb09d26a19b038b389ce23d4b4c48a73490e73220b5712b +size 199058722 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4b4d8596e60dabfbc9c90a65bf2a34aaf7831b74 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c4163489cbb380cd3abfdeda9e9808aa7b963ee2c5c862154563cfb6bd58073a +size 199058594 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_35_mp_rank_01_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_35_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ddfd7a416dd8b1b8ec15aa0b6d47fedf7a519f8b --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_35_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ce549011cf2015440115b251274cbed4a22a48aad5b8624a022af927893d9e39 +size 199058594 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2de42ca3da9e3c6ed6fde4e6e78e7a8aeff98950 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:265a59ce7b40ff121ea0340f45679e194071df825f120277968dcbb63f4778e8 +size 199058722 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_36_mp_rank_01_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_36_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bca8d6a0ecb6e0013503052c5c5bdd7ef7927432 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_36_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a99f7c44acda78642403a488af47ec94dd3e86e3504e49724d75715a0653d36 +size 199058722 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e0e0c706e06235f31d92a1d7ab4131872729d5db --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9f17d298053b7b21dde7dee702c1b542c7eab273b541929f8cf6d7fcb395b52c +size 199058786 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_37_mp_rank_01_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_37_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5f1b698fb03a1998bb0ddb82ac8977763d6f1763 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_37_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5441de683acc47639f3c74b3693db24204825634a12998ea499ab4e163ad14a0 +size 199058786 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5bd6c34cebc23358c1995e10f794ef472f83e591 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e44add917673e3e02c3167f165b38c48a5edb7432a7d346a7c55110b08f7e56c +size 199058850 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_38_mp_rank_01_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_38_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bdc4deb3afb89f1b3d1ac95ecdfbcdd23b0b00cc --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_38_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c37657339d052b690fc78bf324ceff1505eeb171d07422eebb506814edee6323 +size 199058850 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5565be924f7c6b9bce4680293e060d9fd0bc1efa --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d122cb9687f6687138f82a65e5c14b0b7271c9955e9430af924f31435ba7398f +size 199058658 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_39_mp_rank_01_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_39_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ff76ea9a9aff13b995d88673b1fe0c362404b058 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_39_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c7f7a9d87112524ed67effcc9c6f722830af43f4bd6f7ad993f669f4c81b24f9 +size 199058658 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..48f8bca7c47b823bfaf28ec47be5db214d317419 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:203ddae25daf1f5595427ee0590d36dfaf8ac676234201209ff21081757505ba +size 199058647 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_3_mp_rank_01_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_3_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..08615dc71bdf8f4a2f9001b1c8e8e9ec15fb7978 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_3_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:94fb006023a34df0787a992bf3f9905f4af4fe6b9318db2aa9772043fa3ce0e0 +size 199058647 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ab7cc63a9c2e8464d0a81169ecdbb55f97f10290 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2df439b246e8e516f1934c78f7cc18ad3b4b614d895b9f0d7f4f7f5e08e03484 +size 199058722 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_40_mp_rank_01_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_40_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..64085fa5a40a42fd9fb523fea5da7bd780d8949b --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_40_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7ba001d855704dbe954a7e5a91eb3ae8d429bd2e97da9945801053ad6a4797f6 +size 199058722 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6859d0010d04ccafcea7b3c196bcdc7ca1f5e212 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ddc58370c866fcb054acc81e7982cafb045e854f62374a6ffee8eccb0bf62b00 +size 199058658 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_41_mp_rank_01_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_41_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4efd8ce4b469d16ec2c53e24107c4472bfe9f827 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_41_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fb27f49ce0c7a817f60752000328042f51816d3241275c3467c01a188d8589ac +size 199058658 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..75199b511a26d67e270a24eef9fa6ed207d368f6 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c7db801b5cb10aa62c989a834126e2e4b0b3af2213846ef64a39078d26b0e0a6 +size 199058658 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_42_mp_rank_01_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_42_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6712f79cdcb6ce9df42e0602eceff244e1c59368 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_42_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:30fce93a69ff94d98724d0d67a3b9f409113bd1b4d606c2e87eeb458a2e71c6c +size 199058658 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1ffa1ef13e772ed64ed7a7137f29b02df8c13434 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97080bebea1d5930b3336305a32f29fa66cdcc4ca6fb7bec531047cb0438fafa +size 199058722 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_43_mp_rank_01_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_43_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0bd610226c10cbd1c872f673decb8da14f186ca3 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_43_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:424b6bbeff6edcb191a3194631876cf6d5cd2ddca3c060b9bbb4eabbe001d5ce +size 199058722 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c2effb89a05c22ce8d8c570fb2c52f1b66f10010 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:878d2c89172a8c3d9b19f509652fba04d3fb8d2f80abb31061c328e19596e106 +size 199058850 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_44_mp_rank_01_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_44_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..46fb7511b1f4ce3fc502ce515d1957a287985d6b --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_44_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:43ba77369699c96fb3c941b51ad1743a41521146becb094fcfa3bc612f3909cd +size 199058850 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..64ffce1be4cbeeb86cec4644007f897d6369cc08 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:153c7abb7dea0ff759bfada2e5e46141ac928efecadca199229cfa6bc0f28eef +size 199058722 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_45_mp_rank_01_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_45_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..54592af6d76a1bcbe13d42e3f90bdf02a5b18f38 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_45_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4219988670522558554b5e9ad6c770bd8ddae42b15465dc80bb558c8b11851d4 +size 199058722 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6f108acbb0eb35f745e1f08d6513510f1a9c919b --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:70af285968e8408a2a26747e886939f249abacc67a1aebafde29e1b6669b6418 +size 199058658 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_46_mp_rank_01_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_46_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..46d8de02c530b70f7ca916e278f926eb8d1bfb8a --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_46_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e869a4899e1701048021f1fdf210679b963e6fa1bb154686ff5604fce07195bb +size 199058658 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4c9deb4de46dcec4b0f51ae886ad46b11e4be750 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0fb6e76351670ff80816a8063d7610b8be5fca4c336448200f2c0daf52c21f04 +size 199058722 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_47_mp_rank_01_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_47_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d9a954cb7f353d67e43bca49d8a43f80621519c1 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_47_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f8f2d429e52d11858e0dcbec94a57a08d022511364c5ad58374b4c23e3a3643e +size 199058722 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8be5915de0ffc166fcadd5699e3c1e08dcbade89 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:34fd7912b3c64851ff4e60ff0db6eee310085c2d5e37c58500a902d7ce7527d0 +size 199058658 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_48_mp_rank_01_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_48_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..139e0ceb2896c1a2c84463f2067f5f360269c088 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_48_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2bdd197330500143b1f1d3077ba481656842233c2010a6b4cf64638e69911bae +size 199058658 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8738ff47faaf7469fa9e652d7738207207a2e373 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9b256a90b79947f3fffeb1a5876f88ba74708719e232d8c3ffe9b5758847bc5d +size 199058658 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_49_mp_rank_01_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_49_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..41c9254cf93f5c80c4a5e101124153726a38752b --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_49_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e46883452782c1fcde789e7fb937e7e6a09c21102c504736a248d0b08d08fc29 +size 199058658 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ddac9f5cf1324646fb83caf36c625fb220b70508 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:122f395f10b960bc4513a75be8b08621740315dd8321e25292c231839b782977 +size 199058775 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_4_mp_rank_01_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_4_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..337863ca2999fc1102309e92edd82b5da4f47a79 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_4_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fb8a5f7bd2558bb01b53b017b7ac98957ca96f3eb686422f1a21f9df19354725 +size 199058775 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b814f9830163d978195f7bd81a4778ad6f6cf21e --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1afd9580c0c2c2c7fae5532f72a900e386522abd427ab0c0c739688fc6c7a0d1 +size 199058722 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_50_mp_rank_01_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_50_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9d4c3485105a9731f7a08d46281eb75ed82d79a3 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_50_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9039b2f6bd0f3914af13d2b5b9a3cb2e427aa705ffaa4397864add9a5534a4db +size 199058722 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1defc2f5aff21b496e32f5b5eac16e9df3ecab90 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a7d170b7c66553c490aa38c519f66145fa1b5ee5bfa58bfaee416c568d3c9b93 +size 199058850 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_51_mp_rank_01_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_51_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..540dfe17facac73a6203e8c4442107b0a23e215b --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_51_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b3d0415d22eeb8951e92a89894f33d0a8139cba7161d5fc0d20bd9f6c0735611 +size 199058850 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d5461dbc89598b286928c009e6b77fec8ded8a91 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:67343ccd3761ff9104662e0fcb8c2ec3eeb7165586fc334daece9c6592ac2020 +size 199058722 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_52_mp_rank_01_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_52_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c5ade550ad7ec455a991305dec2fb0977c67af24 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_52_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5b50f9475c975d2c0ae8fefefa08d5bdaf7e71b431959b8463b6848c111bd562 +size 199058722 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5b7f71c34b3a4e65a63be8d90d0a444d76d6e2c1 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:58c687504b28adb446f2e4c73410a7f7f0aeafbd8f772b024ed5352e5c837e12 +size 199058722 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_53_mp_rank_01_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_53_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..69ea31aa815bc9ad122a48cf8580697a6e6985d8 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_53_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b7c39a8e269bc5216ab9eada79238b45a73f77e6f24a89220989a015cb45721c +size 199058722 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..46f2d1b6aea4756c3c5a9636f21acb28b5aaae39 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:535a9740bc949b37d1bc3d0a674c8fc9b6a5507b165fc644e8edb1691f7df92f +size 199058722 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_54_mp_rank_01_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_54_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7e6900fca33da7634529c3d60b963948366bba5c --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_54_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:864506f7954801ae6659b4659905079b53a8395c82463cd17a0019dbadc8738d +size 199058722 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ceb74ad39f3d87cd73d45341d77b0f580ea8dd68 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cb97712450ee776e9d220973dcbd0dcddf330c426d0641a363fe62d82a9f0348 +size 199058658 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_55_mp_rank_01_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_55_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1782c35e6a81b999771f5db02699d9dd38f28c68 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_55_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3cd073ea96378f4cc3d5c55094bb9eb21d5c2cf2152ae4d37a2d76adea3d7387 +size 199058658 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..121a84553fa6f3c878df35374318ca7e6dfdbfed --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c0715b08efd811d918d8c498e5b1e87bfbcff0885b8312ee6b6819227dfb9346 +size 199058722 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_56_mp_rank_01_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_56_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c17e10f612ca1d63bb8bfce6e68fcf24b5c5cd60 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_56_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d0b1dbe35e3e3eaf12ba0010c9e5f24a6354ef896fd6a1a766466e28c5742e4e +size 199058722 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..82eac4e76fdb5fcaa466949a2debd03225ae7695 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e93a776de45c5b6623646bdbb852adbafa9ae7cefafe434fdba82860d7b148ad +size 199058658 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_57_mp_rank_01_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_57_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..317736f80d5cc6e7148a1a8e22cd7f0ee03f1d3b --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_57_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2a6ae1aa1daad8e896a9315e74a4f05baf934b53bcc429b1fddf9c3c73c54295 +size 199058658 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c84ef8ff13c384233bd922b86b9e26eb1347ba4a --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:03cbfdc7eaaa1e4f5e33dadc08b2847bf57f9b83a3ea5425a5609c0ad9512bb7 +size 199058914 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_58_mp_rank_01_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_58_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..06cdcc6326c7e2189686232de49b392df2045d69 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_58_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:47967487019c98266159a38daf957936e9c9298f5ad69f37f256f5cd09ae609e +size 199058914 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1382810ed8b5179bc7c468a784551eb208b5157c --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:10135af1b928f00d93e1a7590a173e34c084000bb5519745cdf5632d2273e16d +size 199058658 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_59_mp_rank_01_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_59_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0b8599d6602c7e1aa6a5833a6018a328b4a9dca8 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_59_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:121b713fdf6938005f9d98f3041105cecc0b5fe9f3b72185a63e8830ad2a26eb +size 199058658 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e232fa2358af16249ad8177e81469408550a853f --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3639c560e630a993678a098d113867f81516ef0e473bf3cd8a45e0bcc98cf852 +size 199058711 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_5_mp_rank_01_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_5_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a5a523022d79429a444475e8b5a94b9ae705f2ff --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_5_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b9f547c9416c4b55f18d75facc154b3389a063e1371222ef8d87fa34e3a40add +size 199058711 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2cf53297e0c453b0c0565c4ca386242ac5ae67f3 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0219a7db684c99776579918b926835b95e070ceef8209a05e267d2f1745d6dfc +size 199058722 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_60_mp_rank_01_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_60_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e171670f1ce77319f38a2218fedc2c4640aed811 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_60_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:52c53986bab6957ae2ec5cca01b9f1d0d78cd6ff1064b4dae06506ea4c9950e9 +size 199058722 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dc74007d2033e647e10b4be49a97066bb1a17d8d --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b9ae386184e0d3974310bd06d30c7b371afa3c35cbb8417f745465e85181b5fd +size 199058722 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_61_mp_rank_01_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_61_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f257e1c06a3032b06d9df0df6337a390702c4569 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_61_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:61b127d88110fb70bbbdd821cf324b2c0dd3d80e942d154c2fa62c39c1d50145 +size 199058722 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b023d3fea48a9cad66ca6662060d5b95d44bbc81 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a5b578f26e85ea782440d3b988a406acf470b1a141594ff8e52bec25126c0b6e +size 199058722 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_62_mp_rank_01_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_62_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..64664efb51df0da4076d32e58fa2207aafbf6e19 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_62_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:77e5dd8ad592ccec95c6544845aed5f7cce8046dd9f81e5e98cd60035ff0f16c +size 199058722 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..60eb32fd2d06e23a777df0fdf2f167b53ecd76a4 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b876a32c9ead1d65171dcacd50169710b3c49110a40ffce4193026cfe8d6a755 +size 199058658 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_63_mp_rank_01_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_63_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fc8cebb463726cff87b28e5cefd0cbd48bb9edd5 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_63_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f0b5c2096b56c0c31f8964a211227e9bcd18f2e39ddc862a3257155dc0b82222 +size 199058658 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..273a5e021687ae96434d8824037de2b79539e69d --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5684edb2474d59cdc1db64efdc2a9215068b5c52cdb6d00134da0e51b16c5cb0 +size 199058658 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_64_mp_rank_01_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_64_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..59a7da9c9440900b0d1c37eb5ccffe9c9d757ff0 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_64_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:548a6030f4141426f6f51d2358adae8b5661885b63c3a25e1dbeef93f4b7937b +size 199058658 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..24846806f0adbb16b3072f86bcc5942727bec6eb --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9cef0e9f3ee2ce0038875d7ba066d08b7596b3fdc99fd537fd1731444cc153ba +size 199058850 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_65_mp_rank_01_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_65_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cf5089162c3347df960a4214f63e2f2fc85b2c7b --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_65_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:48e8fa40735e2510f14e4d94b651010daf846be75eab920729c7726acea404ee +size 199058850 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..54f13d07004e43d8d5bbc1f2d1d590ffb6967708 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:56df15e49ecb20ea78b98ff8fb1f447a8518d49899de8c51f50086d8f8c920ea +size 199058722 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_66_mp_rank_01_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_66_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a66bba0db3a0b6f6a2f2386ef337b9ab2aa3c49a --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_66_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:045b99e1f76567b0f0063fe9ca04302790abad698ba83a0516c77e99c027d87c +size 199058722 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ff3fdf25908a09daf4f10affb0e14463795d5672 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2eacc17390ebf2cef422e557504812a1d8116b72ee945ee0936528acb2b32caa +size 199058786 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_67_mp_rank_01_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_67_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1db57866e6a58c8d1d838f7c128d60f9db11a43c --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_67_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cfc8d8deb140bb3db290a40f261733757f3614d9a4da59afdd352ea96d4eda66 +size 199058786 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0adccaeff028d15ff5d0b16c2b960e9a6581ba7f --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c3b27f222096ba6952b23cf8c4365144bcd137b2ce733c31713007374e56f421 +size 199058658 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_68_mp_rank_01_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_68_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fdb687a6b0f0ac25d14cbc7df08e9ed4c31c522f --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_68_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:be1d7f60330b637c2ad60aad0a198ffb3197516d53f9f1aff9b67dd858eaa400 +size 199058658 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..91c195ddcf6cf25f8e341bdb2ba3989a7f19aaa7 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f2c2ba592cd13089df295298830535f6c8612f393840b4b522f47714842beaaf +size 199058722 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_69_mp_rank_01_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_69_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9bb9494de374bd2a6aa3f9fbd244f3f6e7fd5104 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_69_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a449f2e7b25bcb9aa9cc723e44d00f8fe13029c71520bcfda3a816f0a347cdc +size 199058722 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..95d15cfe7b221415e6499e860955594ede391471 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c389fe5bf0048ebb3f20a11bcfbe5b400b08dccfc9b096845ee589d2b0a5a18d +size 199058647 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_6_mp_rank_01_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_6_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d8d4b9304802773e54effbeb31107313d9c3e769 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_6_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a29b4ccab8b84911708fe66460567dd2b08519b351a3896d0b05e56f57d5f791 +size 199058647 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5e08189ef69948785de0d567b0b55465b4f61921 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:790bab49272a566a75e4769a84d2de4a3f09e0007dab36a3cd64b9d366a50b52 +size 199058658 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_70_mp_rank_01_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_70_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3b4b6853fc72b51e4d7d8b76727d42ccb4e8421b --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_70_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1897982804bbb9300647b62b5e31b668ca692264c6a95270d98cf0d627e1f559 +size 199058658 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..74d474c195cf1ec09d67e9e9629fc68947964d70 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7b1d362a270722258326d0ecfb0efcc4536fe276b073d8b42ea1eb0ddfa81428 +size 199058722 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_71_mp_rank_01_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_71_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ffb79d32ed50e0094a4419ce3bb78f7688c85282 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_71_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bf963a78251196d42b6f94439b544b35ef18578feed15a7f6e2e3ec78f9fee97 +size 199058722 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8978234f25c6454a09babb974ecb97e9b157c200 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1378004468f78d00a1b0cdde64cad0cf1acab3e8eaaf3a7390f09095e0471b71 +size 199058786 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_72_mp_rank_01_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_72_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2323bf9e4871bcdb4a6720bf853d2ac902d84ed0 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_72_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:73eb0265138c4cf1e697ac3da19253449ab5f9de490083d0d86da8a1040c9c82 +size 199058786 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6888c77dc530ce8de92b25c4ca6c15fe3a02d72d --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:31a8e6e17d9e11806509060c6994e6149c574d0d687c7a12bec01451d784839e +size 199058722 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_73_mp_rank_01_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_73_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..335f489748a207c666b36c97a25d58c5c911378c --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_73_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c22f03ac29244f726dafe7fd8712e48a6a09ec93ebc9c2abe7fefa0d806200d0 +size 199058722 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..643975e354140b80bc2d21cb9ee11832dce70367 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d3dac543d66aeaec88999aa1210db3759dac6b8d9113c7b370c7f953a669b5a6 +size 199058786 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_74_mp_rank_01_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_74_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4907c8a6e8469217be2594b265e79c22c224b28a --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_74_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0d6b330c2b32156ce03b74dcc82102a0fff10200a484ab0d3ee4a6389d70b1a6 +size 199058786 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..34d9d17656de9e5e1c44c98a4380046aaa4f0899 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ec21604aa011d8d112b60fe2a9e43b42d41d178e3154328827c2c65ecf08b2f1 +size 199058658 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_75_mp_rank_01_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_75_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6879462e72ea37519c1df3e7a3ecff4b506bb227 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_75_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c345e01fad0454941d12f636d3a230f792682d1a7c29fdb4bb279ecb587145f9 +size 199058658 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fa655334330a69eef2f90f962da8bab5fbdc8188 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:44b06a47f91228850dfffb116ba735274c16cf768a752e1372f02df89ddf5872 +size 199058786 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_76_mp_rank_01_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_76_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..96544f0c25bce463bd33a4eb94cf7f3506993508 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_76_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5838cf5d478de1895d4bb38b255a753973456d2e1fea1cfc43ca36419b5356db +size 199058786 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6228c627d6031a26cac96f5fa8988bc16fdc3a39 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b82f2be51d5ee1e7340734ed1ac7537547047c6dd161f45da04f8fb92a535fe3 +size 199058658 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_77_mp_rank_01_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_77_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4698d834cea03f0f510c5838ef570a8b230ec8a6 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_77_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:316ac9cc91ba874b8816e7227052917352510aef21711efac81275bc70abd570 +size 199058658 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5a09f1a94f96903496ed1f96ca0ea29d5e16dd7c --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9e919ec5a66b447c8e7f60bd71ee7a6f374f0aad283b7004db36026cbc0f0cb2 +size 199058786 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_78_mp_rank_01_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_78_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..70d188cccf61106718200ba1a6aff7d39e4a4638 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_78_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a7049039f560ff8c08ce026993c69fe679e0eb848622583ac69ca0f55bd6b092 +size 199058786 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..de0d05bb8e215cd6a66a05e6be02dda452dfc3c9 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:69eb4899079cdf81cb2cebfb2f576b5441d548197bf1082c20959e587d53a7db +size 199058786 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_79_mp_rank_01_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_79_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..175cd537716b8644ecb7c6405f239470bbb145e3 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_79_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2caeca337d5ef272cc2b5313d5faff92bdf2df608e190d4173e1847cc4e5c4d5 +size 199058786 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..30900caf169ac7912e527ae50fe070cd755e4b06 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0999a67801a1abc89650dc7dc15d114b8d3a8af1972d416a7d48c1141e1083a2 +size 199058647 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_7_mp_rank_01_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_7_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8a12102c6947d1c65b891599529ae30c15602732 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_7_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6a37911fd932b2c1f980e0299049e83c16f96d10ce0c787872c065c0cb977df4 +size 199058647 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..758352549868b2916374abd05618bc326a13bb58 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5c6c6b051acd3d46327a35ed3ebc5922465020bb6e60cef4baaf62b0a89ed4b5 +size 199058722 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_80_mp_rank_01_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_80_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fe10576d96dbd9d010b4d42dfd78481463124e46 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_80_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2f3a839030e666416477fcba5cca2ad425e18c3dda68aeb75abb3cbd16e4463d +size 199058722 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3033a5b439135b4eaee5c4a07b7edcd4a68806ff --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1419c5a697ed4db26bc395fc6822ca3dc2f39ad13f2268ec38bdad3a2d425833 +size 199058722 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_81_mp_rank_01_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_81_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..932a98733ecb6c39acc0a1d67b9fde6c8c30d60a --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_81_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0b59a020cb880b7a6393ca009bf3b66eba151a084e7ddfc1f884748f7cae2e77 +size 199058722 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6135c16e41d74adf391a8f68380a9c2593c80a54 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:690f857b16380afb1d86735c98388f11803e5b35413127c28d7842ff9b83fa44 +size 199058658 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_82_mp_rank_01_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_82_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..50e302dfe493692eacc79f05f5aa34a48fe586c9 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_82_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ed9bc7f1bb7d25b9afb41c22537ad0b7ca1fd919334be0f9b1336c0f4078cf1b +size 199058658 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d512364d97b0e525a4f04260946b946424c40def --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6bce05873d5730f6bc1e3f6ce55979e5cac8c9b1b23c0ccd02bb6c7801f57d23 +size 199058786 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_83_mp_rank_01_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_83_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fc622de09c47fba65d74950750433f1d4e49dff3 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_83_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2d588fabb524ffe42fd99236e1d546dbc3abc127e3f76cb61b1d1427b382c390 +size 199058786 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..595e66b3d815a1e1fb11f906e5e5a3c92d19d660 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df5c210ace287e028611bce60a07cb2a8fcd232564a0a2dbf3244686402c3b32 +size 199058658 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_84_mp_rank_01_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_84_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..51f39be29d6bf621604b13db9a31caee07f38c24 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_84_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e9e55c85f61c170682f710d3251dfcce6b755cf7a326aa05393aa95194accfe +size 199058658 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..48423b2352d8cef1f3fe09d5c533465339d105f7 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:17f21c48d2930b53ea9e89618593d9c61b08cb09edd9339392b4f5bc9876e2b3 +size 199058786 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_85_mp_rank_01_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_85_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5c12c79d4073ee5e3b131989035c5883aef1a27d --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_85_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:19222d8bcf7c05c410c4f0638238c63b44aa0ac68522d90ebe874e7189ac7045 +size 199058786 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..aa71b791663c2c524d96d4c778352e7ba5c56f7a --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dea39d877f3373469f33444da6665e92b662583b0d9abb9b63cd508da3a9c23b +size 199058786 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_86_mp_rank_01_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_86_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0d9a9b56cefec70917645be220eb7b40917b24bf --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_86_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3df5acdee128795c595f88fcbacf7359a01cf143d18bef1606278e3cd951c56d +size 199058786 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4c8322ca237227ecf84df72b45fdf7c6d5c3399f --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e36a924f54f2d7cc961bd1546c29aa9e34af27efb0f965f9b31efbd632b9c90 +size 199058722 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_87_mp_rank_01_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_87_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7c3bba2a10a369540e218b00c4217e6a276099d0 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_87_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a45e4e037df1272b2bd15dad9294f0a00c4b78a0cd524d0828c79e830c540dc +size 199058722 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1c522abafa117e8b208dc58ff7bcdbb69a97fd6d --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d1f5f583d05c10f2df483fcc684ad0d23012d45344dfc5d1002bd5c7c6682ab0 +size 199058658 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_88_mp_rank_01_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_88_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e0777055f668bdb4ce339b4aead0291aedf6fc2d --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_88_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:539ece594505dc4dfade8dcaa9cab00a7a31a9c5ad52ac7b7bef828359b2be1d +size 199058658 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..75ff69a4da2ac686ba2f77ced6434570daf6a1f0 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:22a68e100cab6862a0ca107e98ba44cf5c32e007c5073a5547a728153d901557 +size 199058658 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_89_mp_rank_01_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_89_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ebb3b128925c041907187c297d67a0cfb3a7ac47 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_89_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:10b5d0131e685c4ea441166923ae203bd2f4c654ba0244789a6fdb2f7e45af0c +size 199058658 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..948e15b6c46bfb1eef13c7bc9c02e580391f0d74 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:079339c8170b464e3b3a14a7d5010b937e442906824e8669dc46f4229a6442d0 +size 199058647 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_8_mp_rank_01_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_8_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8fe97f7d709d6bf07523145e494cff26b07f87f0 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_8_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5b9ba5414640a2567d56ab6877dd72624cc45535cfe407d4e5d125f995794284 +size 199058647 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..955660369737bfb950a8194c21518341f80c729b --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:73813429b5b75bba41c9796e037d5938969c13dc80e28f99d9499a46f4c86d54 +size 199058850 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_90_mp_rank_01_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_90_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ecf74e150cb1bf618d7e06fd94d5585669364e04 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_90_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:34e10d1ed568cf78a1ab4937b7ee716574f97b942d54ce3895f017cabc3867c5 +size 199058850 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2b6ccc3aba7c2e5d7ba81f5498cbac927fc74983 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ed9cfdf53f47d7ab0558bd5b1c8b2bb9d7084adaf3bcb896fc460256c731504e +size 199058722 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_91_mp_rank_01_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_91_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..be1373c173393da90a33936b5ddc5df07a2bf9c6 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_91_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bab6030dca6aa8f776bc71b9126134f5b4e055af915d69ef8edd049b1039e3d0 +size 199058722 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6b210432dc13be58cad7f34af89960d79aca931f --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:542546525f221dca8ddc876aff02e49dbbdd9351dbde82b35dc209c91970c0cf +size 199058658 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_92_mp_rank_01_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_92_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6fbcc80d56f0b5a50aaa940ea4558ea8c2532bac --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_92_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a4f56248018e7f9faff5a64f7fe94ef10d4a732633d04cbbdb7ce68845de3299 +size 199058658 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a371e448392d3b838761236d3c8fcd8e1f77eb4a --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd796c81fe09c39903def030908e31c502dc3500c65a09da9b271d5858d56046 +size 199058786 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_93_mp_rank_01_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_93_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6244605f886cf4afaa9d55562ebd39259fbce136 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_93_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aa50242de13ed89d357ac0d476f6a92183219d8cc8f08bdad92c263127ea3f65 +size 199058786 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..97c92b82e0c26ab710a59091b9b827bc0dca7ab4 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:66ed5e461cc3e6e336e5cfc79646c7ae035f1fce2fb5597bb106db1c5f82536c +size 199058722 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_94_mp_rank_01_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_94_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..81519df38e10da098aceaeac7740c74f8d94efae --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_94_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c1e6250d30ebb3fa18778015cd9f421b03c8d6a94e4b31582227d65b47f6f776 +size 199058722 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bbbfcf935dfd505a14bb0252c08c8c2b2dfa7e7d --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:50d66a48bf200698c898f1ecc52715048c14e2fcadcacef2ab27eb550177d4b1 +size 199058722 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_95_mp_rank_01_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_95_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ce4ee09d1d6088b6db42669701ef493045619d99 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_95_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:137f31c38d8e12b92f3bb14a12dd89641fd4aa3eaadc2dcc93f276b436816036 +size 199058722 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9f3783ceb1cb805a5853eb2e2ea8765f6c8f20f0 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3cbdf52e25bef28036d2c49ab910c3da9696923fca806b9f98514c2bb87dfac2 +size 199058722 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_96_mp_rank_01_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_96_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0a9379cfb184a2b6d8e2853df48191a24c259621 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_96_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:035570fa1ab3bb2aab54af1fb591fdf93325300aab0db7c8294c040ce5a1fb4f +size 199058722 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ec4e6c321003f2d55e8ca4868a5a19e3bc83698a --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bcd88f0969c0f5601b9ee2aa2ac33f1914d29597e1f0fc4c4734578935d2878a +size 199058786 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_97_mp_rank_01_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_97_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3446a2192470769e5f0b44a8b875a977210bc49a --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_97_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae3ed5074cad5b55e820407a877093648de8b45601bcec215bb398b87600d311 +size 199058786 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d18d48d2d88af790be325d089ba77008d817df08 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f8a0a1be8c88bd49bf4aea66b2dfd025e0f7bdd516e7e3bf39c5918778dd2df0 +size 199058658 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_98_mp_rank_01_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_98_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d8345b381f3ae063c69024d0f43ae2d883004575 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_98_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3be2b4e2e9945afbb190e67719604774ebb353ce387dfbffc43f994c337f50ae +size 199058658 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..57298df1754d3ac77d40f3f9c458c97fd24778b2 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ab80aa4350facb82ebb2aa367170f650e9f1ffa17605c4fc7d901d0e166d75b9 +size 199058658 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_99_mp_rank_01_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_99_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e6f0d293e99a1dfe1edceb0412369a01eeb89f42 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_99_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d3a9058592678c3be6da612b7ef28192cb1c15dc0d4c3fb3c5e9cf806ced6897 +size 199058658 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4c5df5b1b86901b2470066883fb5e084439f0532 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f9032b63798a900790bd0159371ecac3059b804ef3cac9f9fa4f4c29f0e96c84 +size 199058839 diff --git a/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_9_mp_rank_01_optim_states.pt b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_9_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..61e76e46b221aa547a9e4857adaf7b5b9872bf28 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/bf16_zero_pp_rank_9_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1a7950f9d8e1c8211e7cf689850361e81e1eb3e6cb42e1c97b60923649dd3230 +size 199058839 diff --git a/4b284b1b9c4seed1/global_step80108/layer_01-model_00-model_states.pt b/4b284b1b9c4seed1/global_step80108/layer_01-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fca2f11853958ffdab88deb72695ec9b0b4bff66 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/layer_01-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:daee0dee0fa247046bbcf0f173d0cb4c9c78780c38f4277dbbdee23a56bc3c70 +size 167511299 diff --git a/4b284b1b9c4seed1/global_step80108/layer_01-model_01-model_states.pt b/4b284b1b9c4seed1/global_step80108/layer_01-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..32c28caaf6c6a52e8f497a6b6a9f3ad74633b8d2 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/layer_01-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7fdc2d8112c9b2eeefee8d1f16cec7c95f00ede7334db4daa097da0d76e755a6 +size 167511299 diff --git a/4b284b1b9c4seed1/global_step80108/layer_03-model_00-model_states.pt b/4b284b1b9c4seed1/global_step80108/layer_03-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fdb8b84bd11b1e20c76e807260f09eb1f8d62018 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/layer_03-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d48ed07806b721cad33a6b251c2796aae5e3822945f30f4b84342e74c0fbae88 +size 113308931 diff --git a/4b284b1b9c4seed1/global_step80108/layer_03-model_01-model_states.pt b/4b284b1b9c4seed1/global_step80108/layer_03-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1fa68e0cb6de72ce6aac5bacbaf1ad305fa59ef0 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/layer_03-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ff21f2afb029ed410135929cffafdcc3f6e7b55c946e942c6466040b09bc1da6 +size 113308931 diff --git a/4b284b1b9c4seed1/global_step80108/layer_04-model_00-model_states.pt b/4b284b1b9c4seed1/global_step80108/layer_04-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8a8a063b5c05e45615e36a7d0fd99b33315ee9c5 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/layer_04-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fa90d944feee38959ff202c7a68dc8c7c162b591e23475ad81c2260de88b18a1 +size 113308931 diff --git a/4b284b1b9c4seed1/global_step80108/layer_04-model_01-model_states.pt b/4b284b1b9c4seed1/global_step80108/layer_04-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..659fc78ad2c2cf172d77f40adb01436fbfcd4d5c --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/layer_04-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:44c6af049a1109b131637110b6ade791aa4f0b35319cafff482143efc67eedaf +size 113308931 diff --git a/4b284b1b9c4seed1/global_step80108/layer_05-model_00-model_states.pt b/4b284b1b9c4seed1/global_step80108/layer_05-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7da0de1edda206a4ae4e104bc196fbdf3b2697ec --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/layer_05-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8f4a8e4240c73940e3891537fb0b57960544c95f8f86706dc49a329bda9b95f2 +size 113308931 diff --git a/4b284b1b9c4seed1/global_step80108/layer_05-model_01-model_states.pt b/4b284b1b9c4seed1/global_step80108/layer_05-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1ebf5cab37c2b91846b7a34323aa0db96707d67a --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/layer_05-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:43557fe3a9d45df65bb947ffdf51fadb4388c115178e74817b6fc0baf3d25808 +size 113308931 diff --git a/4b284b1b9c4seed1/global_step80108/layer_06-model_00-model_states.pt b/4b284b1b9c4seed1/global_step80108/layer_06-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e08dcfc2af3cc6b115aa2260565a8a06d5c7b45 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/layer_06-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:de276865be73c2fd38a5f98e088c8d391a887cb4ea8d89bb950d92d964e97170 +size 113308931 diff --git a/4b284b1b9c4seed1/global_step80108/layer_06-model_01-model_states.pt b/4b284b1b9c4seed1/global_step80108/layer_06-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a6b8a059d18fb262398d1d69765363e8b3bcd39e --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/layer_06-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:db20b73a071198ee0bdcaf728ea864457bc1f2f706b4b02189bf6cb30dffc973 +size 113308931 diff --git a/4b284b1b9c4seed1/global_step80108/layer_07-model_00-model_states.pt b/4b284b1b9c4seed1/global_step80108/layer_07-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c6378ad8870c1df6e88657a4cd5674fabe68db5b --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/layer_07-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d7c3a37e1b1820d0166440015ecf01743c552fa53f8bc69dc394951b43da4f36 +size 113308931 diff --git a/4b284b1b9c4seed1/global_step80108/layer_07-model_01-model_states.pt b/4b284b1b9c4seed1/global_step80108/layer_07-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9c1e73f37fe37b3032db7159818dca2ecf0dd527 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/layer_07-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c9ada0b18f98594583e0866b567e5a5529dbfdcae5fadadb3af749cb70c0efcb +size 113308931 diff --git a/4b284b1b9c4seed1/global_step80108/layer_08-model_00-model_states.pt b/4b284b1b9c4seed1/global_step80108/layer_08-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f110851d0a0506155e821bb7982a689e2e2b0cc8 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/layer_08-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:75801ecf3ba0290e0368df210370c58fe241667ac1a1d6bc7a323cffb8b4fe85 +size 113308931 diff --git a/4b284b1b9c4seed1/global_step80108/layer_08-model_01-model_states.pt b/4b284b1b9c4seed1/global_step80108/layer_08-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5154586efafd341f03412f00c5ecf1f73cd91cd7 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/layer_08-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a5d644d4a596916f072aeeff752befd9982129ef7ad7de6e7d141528e91dc401 +size 113308931 diff --git a/4b284b1b9c4seed1/global_step80108/layer_09-model_00-model_states.pt b/4b284b1b9c4seed1/global_step80108/layer_09-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8b4016431ee518104f259931f09421003a959417 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/layer_09-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:308cb90ccfa220ab206021a1fd4b0437006cee254ba72bb741b764d3038a2a47 +size 113308931 diff --git a/4b284b1b9c4seed1/global_step80108/layer_09-model_01-model_states.pt b/4b284b1b9c4seed1/global_step80108/layer_09-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5e0a2d1dd1f247f0786b788490e70780c881b4d0 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/layer_09-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3110d66a20fc6089019f8e72770b3cbe3ed0f68a0ece72865465e04902e6b1fc +size 113308931 diff --git a/4b284b1b9c4seed1/global_step80108/layer_10-model_00-model_states.pt b/4b284b1b9c4seed1/global_step80108/layer_10-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..78feea2f52ac020f7d597c9f714d1e545a7abaab --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/layer_10-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:762a83b755c0c8f7b64434401b055a217c39982dcc4ecb4cd0e69c51aae7d22a +size 113308931 diff --git a/4b284b1b9c4seed1/global_step80108/layer_10-model_01-model_states.pt b/4b284b1b9c4seed1/global_step80108/layer_10-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c88a87d428ff4fa7ffcbadf30d0d0dfffd761ecb --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/layer_10-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:34caa6610a0d883d6195be51a46b0d447941dd875c6a56152774dae1d36193b9 +size 113308931 diff --git a/4b284b1b9c4seed1/global_step80108/layer_11-model_00-model_states.pt b/4b284b1b9c4seed1/global_step80108/layer_11-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6efeca8dd31c014696394aa2147cd016c302e3fc --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/layer_11-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:15be455d77989b469d7cb526b095b15bc16fc44fbd2acf86c650b7cbb1164942 +size 113308931 diff --git a/4b284b1b9c4seed1/global_step80108/layer_11-model_01-model_states.pt b/4b284b1b9c4seed1/global_step80108/layer_11-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9d8a9dd51196971d4e6cd0bc004f50b5e17a50ed --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/layer_11-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2831c58f7b45f98ba4343b2d4d8f894b26749709332cdda83be11447eccf618c +size 113308931 diff --git a/4b284b1b9c4seed1/global_step80108/layer_12-model_00-model_states.pt b/4b284b1b9c4seed1/global_step80108/layer_12-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..701773cf5d8bd442cfe2473e701c53713212c792 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/layer_12-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:57f1e58267008b9b927d2dcbc91c07bcebc380246f3ae6fe4316085a67a1da72 +size 113308931 diff --git a/4b284b1b9c4seed1/global_step80108/layer_12-model_01-model_states.pt b/4b284b1b9c4seed1/global_step80108/layer_12-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9023f46bd8eecc518faf48fc38424ae6b151acd6 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/layer_12-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6d362b0f79208ab4fd3ddbddfb381c1e8b8608ed155c56c5a00f1b2bd0f35fe9 +size 113308931 diff --git a/4b284b1b9c4seed1/global_step80108/layer_13-model_00-model_states.pt b/4b284b1b9c4seed1/global_step80108/layer_13-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..95d24a0e31e7b41c13b78661ae51ea730ae7d0e1 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/layer_13-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2b3c9dc56e192b79f4b4b8fc5fb448e00e206423bb7ab416398db085ca007ded +size 113308931 diff --git a/4b284b1b9c4seed1/global_step80108/layer_13-model_01-model_states.pt b/4b284b1b9c4seed1/global_step80108/layer_13-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2510f4ed6b88cd6fe9dd034cb02518fd4038b0a1 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/layer_13-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b3bdeaf687324ccc33d2fb722c0393e7ec42be2c9cf50d8cf344604808842742 +size 113308931 diff --git a/4b284b1b9c4seed1/global_step80108/layer_14-model_00-model_states.pt b/4b284b1b9c4seed1/global_step80108/layer_14-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d6e9d8bc9c02207a79c8da567b6b39a5e8a1c767 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/layer_14-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3430371be7e64443680431f7118a4f93142354d09b9b6342b35dddd6d90c23a1 +size 113308931 diff --git a/4b284b1b9c4seed1/global_step80108/layer_14-model_01-model_states.pt b/4b284b1b9c4seed1/global_step80108/layer_14-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0ca9164133816393f2daf95337914ac33d494b2f --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/layer_14-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c7fa13462c0411e82794f2d6d70f143a176b147eff0f756fa4bfd5ab2e52992a +size 113308931 diff --git a/4b284b1b9c4seed1/global_step80108/layer_15-model_00-model_states.pt b/4b284b1b9c4seed1/global_step80108/layer_15-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8fcaa55fc25e6e20543e5919beafd98c0174aa43 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/layer_15-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7daf9cc394fca6fa9d541b315773496f42c687a971aaca2fbc7ef0bc905097ef +size 113308931 diff --git a/4b284b1b9c4seed1/global_step80108/layer_15-model_01-model_states.pt b/4b284b1b9c4seed1/global_step80108/layer_15-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5e12e875e17e9b87fdcd736380b341390472d1da --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/layer_15-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d31142095de9338fab989a46f2a60413d9e08be5a602c3fcde5769d96ad2c6f9 +size 113308931 diff --git a/4b284b1b9c4seed1/global_step80108/layer_16-model_00-model_states.pt b/4b284b1b9c4seed1/global_step80108/layer_16-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..60add93121dfa6bea9c145773cded8dcbb3e37e5 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/layer_16-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d817d85a3f8111bc597d9b145ed5595b9d0bbb789634f30187bd5a2762f8254 +size 113308931 diff --git a/4b284b1b9c4seed1/global_step80108/layer_16-model_01-model_states.pt b/4b284b1b9c4seed1/global_step80108/layer_16-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0a7e5434bef15cc2f82569cb0c376de02038419f --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/layer_16-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:59d463aed7bfb1e8fe0eeaf99bd0dab1f3df23e54fdc7af26c732d52f040c571 +size 113308931 diff --git a/4b284b1b9c4seed1/global_step80108/layer_17-model_00-model_states.pt b/4b284b1b9c4seed1/global_step80108/layer_17-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f825f7506bbe33c651172382236e138b40aa3faf --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/layer_17-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b532a34f08b0af449f063544d3e33a76df5818800f3466269585b23426dbdb4 +size 113308931 diff --git a/4b284b1b9c4seed1/global_step80108/layer_17-model_01-model_states.pt b/4b284b1b9c4seed1/global_step80108/layer_17-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2827964e5d070e5e466b332e6d14edf91f78d740 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/layer_17-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df8f35032ae0551de2c29fafe157400a0989116ad552563ef9ebf00a86860057 +size 113308931 diff --git a/4b284b1b9c4seed1/global_step80108/layer_18-model_00-model_states.pt b/4b284b1b9c4seed1/global_step80108/layer_18-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ce76cafe41dac01799ee1738e1811e3bebc26fbe --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/layer_18-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f63a144ed67aee51a12ec1c079d88ebcf5409806640deaf8232dd22f2565bf7c +size 113308931 diff --git a/4b284b1b9c4seed1/global_step80108/layer_18-model_01-model_states.pt b/4b284b1b9c4seed1/global_step80108/layer_18-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9faa72311b07f1286ce2c05960b98691ecc680dd --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/layer_18-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5940f24e92aee3ac75816a1ba71216e10ba76055de71dc65e93deeafd44117cb +size 113308931 diff --git a/4b284b1b9c4seed1/global_step80108/layer_19-model_00-model_states.pt b/4b284b1b9c4seed1/global_step80108/layer_19-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1c70c2ccfbb1893facebadbf74648ef418508adf --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/layer_19-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9760efa072624d48ae82fc11b59fd32d4e14feee2765f451eb532400dd08d27c +size 113308931 diff --git a/4b284b1b9c4seed1/global_step80108/layer_19-model_01-model_states.pt b/4b284b1b9c4seed1/global_step80108/layer_19-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dd127eef5411ad2ef00830616682363b4a50b0ee --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/layer_19-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df85e01ce2d4112211d40f31e4e2acc90f7a9763d3781234500882f94a6d8cf5 +size 113308931 diff --git a/4b284b1b9c4seed1/global_step80108/layer_20-model_00-model_states.pt b/4b284b1b9c4seed1/global_step80108/layer_20-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..10beb6f911c2d67ea0b03b2edf1fec3cd923c296 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/layer_20-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:431b6dfea919357b142666918e236065dcd1645cafc24fcbe393a5db5eb5554d +size 113308931 diff --git a/4b284b1b9c4seed1/global_step80108/layer_20-model_01-model_states.pt b/4b284b1b9c4seed1/global_step80108/layer_20-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e8b559da436f1b2044b406913e7e78f06cc3e07f --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/layer_20-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3cf1842c2f85f1ab5b6a2a1a2b4b32595b2211aa5a30acc84c3183b98987f8fc +size 113308931 diff --git a/4b284b1b9c4seed1/global_step80108/layer_21-model_00-model_states.pt b/4b284b1b9c4seed1/global_step80108/layer_21-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a3346b64ff7f57bedd67238e922d093bfc9e0f14 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/layer_21-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c8e58b7e11fe21048e6bd01467ac12b08fe61e6f5126562bddd33fd68baf212e +size 113308931 diff --git a/4b284b1b9c4seed1/global_step80108/layer_21-model_01-model_states.pt b/4b284b1b9c4seed1/global_step80108/layer_21-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..649d39afe3f8de14b810c303ac56257ee363495b --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/layer_21-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca8b23878b515781d554e5e34bf4a92550d4beabaa4d1b36b45abee5052ac71d +size 113308931 diff --git a/4b284b1b9c4seed1/global_step80108/layer_22-model_00-model_states.pt b/4b284b1b9c4seed1/global_step80108/layer_22-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5b24adca5ec67fecbd6fcb10d48d26a20370e637 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/layer_22-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d00a18cacebe36d114b41c692a895f9bc30bd9a4f4f1c57b15ba63f04d557d37 +size 113308931 diff --git a/4b284b1b9c4seed1/global_step80108/layer_22-model_01-model_states.pt b/4b284b1b9c4seed1/global_step80108/layer_22-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7c1d262671771e0a6188499895b4a583ced00da2 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/layer_22-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:95f71affb07e6435fa78dd3c381e2919b02e9cec817239af041e9b99cdeb34c6 +size 113308931 diff --git a/4b284b1b9c4seed1/global_step80108/layer_23-model_00-model_states.pt b/4b284b1b9c4seed1/global_step80108/layer_23-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ebef2b3ff675e2ad6ddf7a20be43f4935ebf6e12 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/layer_23-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b7d0ce78fb38f2f86fb63d326d87728a2a30a8d3b675faafa23d08f267766649 +size 113308931 diff --git a/4b284b1b9c4seed1/global_step80108/layer_23-model_01-model_states.pt b/4b284b1b9c4seed1/global_step80108/layer_23-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f81800c2f3234efa73a19d6176c9d15f3ca1942f --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/layer_23-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:892e9ba485f55e3cc428c04eeee38cdc14674d2fe96279ac0c2620cf164fe6f7 +size 113308931 diff --git a/4b284b1b9c4seed1/global_step80108/layer_24-model_00-model_states.pt b/4b284b1b9c4seed1/global_step80108/layer_24-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d462eda124b5ed92cc218714a5bee2e2c1bacc4a --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/layer_24-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5d32c49ce1b15dec9fdaf1e76621fa60fec5e6301da1aee3b9ee7c798631df1a +size 113308931 diff --git a/4b284b1b9c4seed1/global_step80108/layer_24-model_01-model_states.pt b/4b284b1b9c4seed1/global_step80108/layer_24-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..aa102758641987be0dcc6b0b33e6f6474a4e7c78 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/layer_24-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da309cdcf995bafa7350af228f6209eb43fb6390bccfe987a827993404acb304 +size 113308931 diff --git a/4b284b1b9c4seed1/global_step80108/layer_25-model_00-model_states.pt b/4b284b1b9c4seed1/global_step80108/layer_25-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2bea46c9bf85e4f34213308f2ca8b581e453514a --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/layer_25-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ce5ccf9858553acdfbde34b9b5de4eac9373584035ce46c8c62c308cc5a4f717 +size 113308931 diff --git a/4b284b1b9c4seed1/global_step80108/layer_25-model_01-model_states.pt b/4b284b1b9c4seed1/global_step80108/layer_25-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3219ae0e12aa8942cfd0f8fd6ee216a411f71cc1 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/layer_25-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e7cb18c482a7aee4903f007476957daea66898b0a9b0eda6a8438eb61fe50ba +size 113308931 diff --git a/4b284b1b9c4seed1/global_step80108/layer_26-model_00-model_states.pt b/4b284b1b9c4seed1/global_step80108/layer_26-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..126eecc92bc4001911d059baac1bb32296b33891 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/layer_26-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:06d87690da160a94fc930186cb07971bed838b63ff7667551e9bed60aa447bc3 +size 113308931 diff --git a/4b284b1b9c4seed1/global_step80108/layer_26-model_01-model_states.pt b/4b284b1b9c4seed1/global_step80108/layer_26-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..67dd94439d423c2a3abae8835617f550f831ecbb --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/layer_26-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dde81cf3b0f69e5a61509adccf0fb397800105066e680ab49b88a9f07371b072 +size 113308931 diff --git a/4b284b1b9c4seed1/global_step80108/layer_27-model_00-model_states.pt b/4b284b1b9c4seed1/global_step80108/layer_27-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..504a7b44c399cb888f6e69906501bad87d6e0291 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/layer_27-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c1f05f48df2e207c7d97077f0831b1c3d231e4eea7e0436b02a12a00f8cc2190 +size 113308931 diff --git a/4b284b1b9c4seed1/global_step80108/layer_27-model_01-model_states.pt b/4b284b1b9c4seed1/global_step80108/layer_27-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5dfe9e2026108ebb38559db7feb95f95fa6909f6 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/layer_27-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea26755cf37ef2e85ec15eb334db1c59cfa8481cba98846861ef766e5a2d3fd1 +size 113308931 diff --git a/4b284b1b9c4seed1/global_step80108/layer_28-model_00-model_states.pt b/4b284b1b9c4seed1/global_step80108/layer_28-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b80ce6aa183ea958efb5ec0d74360bdd15d52eb4 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/layer_28-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f1b80636dd69985be8b2137d12c525904fb5d49c4c80a7ee7f2da5409c51077b +size 113308931 diff --git a/4b284b1b9c4seed1/global_step80108/layer_28-model_01-model_states.pt b/4b284b1b9c4seed1/global_step80108/layer_28-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..440608c47cf194b65e81d71c528bce7abbf4bf31 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/layer_28-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:371a7526be703510b97cbe694dca4a166cab87d0bddb9924a2f58a3780a1ee7f +size 113308931 diff --git a/4b284b1b9c4seed1/global_step80108/layer_29-model_00-model_states.pt b/4b284b1b9c4seed1/global_step80108/layer_29-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a5068ed47a232503cb54769d44f55553497e1988 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/layer_29-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fb09604f383f69064f8cea13816deb27541d2c5c6a4c22a00569bf5ec3a1ea9f +size 113308931 diff --git a/4b284b1b9c4seed1/global_step80108/layer_29-model_01-model_states.pt b/4b284b1b9c4seed1/global_step80108/layer_29-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..77bea0a241db86206bc3d0b2c588ba468fb529e9 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/layer_29-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5fc8d1c75c787f2b499a652d40df5f266fd0d574fd5539739f1b6172bfcd6ed1 +size 113308931 diff --git a/4b284b1b9c4seed1/global_step80108/layer_30-model_00-model_states.pt b/4b284b1b9c4seed1/global_step80108/layer_30-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d077f6f0ebfa1d82e7f6f4d98a9e3e86f520d27b --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/layer_30-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:03fa229009a219d6bacc6ef211f9db724351ed1a2c7bd9170d86a4c9bf24694c +size 113308931 diff --git a/4b284b1b9c4seed1/global_step80108/layer_30-model_01-model_states.pt b/4b284b1b9c4seed1/global_step80108/layer_30-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..32c20b7ed4812a7f5bf0a8596c69c7d8d6633a1f --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/layer_30-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:14d141e255279d9e04c9fbbf21cb844260feee52ae0517a6fa270f39d6c8826e +size 113308931 diff --git a/4b284b1b9c4seed1/global_step80108/layer_31-model_00-model_states.pt b/4b284b1b9c4seed1/global_step80108/layer_31-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0ca1b8c14ac48514c3279bb27a3e086513af474e --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/layer_31-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:94a213f99cdee6af1ed1e7f422f3d14529dcfe652984c8c8e68a43fea74650ac +size 113308931 diff --git a/4b284b1b9c4seed1/global_step80108/layer_31-model_01-model_states.pt b/4b284b1b9c4seed1/global_step80108/layer_31-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..59d2b5ee591756bc724d81430e19377c7acb93d7 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/layer_31-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:13c3d76a867bbfed4672a4c809486801eb50f95d29404929febc82051fd40cd8 +size 113308931 diff --git a/4b284b1b9c4seed1/global_step80108/layer_32-model_00-model_states.pt b/4b284b1b9c4seed1/global_step80108/layer_32-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..81e019262faeda2bda5b782600fb4f86b15d1aa1 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/layer_32-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d05cdc0512de6c46e484267ddeda35ae0465873d6250200b1a80ca9b7898207d +size 113308931 diff --git a/4b284b1b9c4seed1/global_step80108/layer_32-model_01-model_states.pt b/4b284b1b9c4seed1/global_step80108/layer_32-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..543339ef8c089e8b8422799e14965d96cbaff61b --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/layer_32-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:077b904a61d15283f43623f596d4c9e7901599bf872b4f80f292c73e03f18de5 +size 113308931 diff --git a/4b284b1b9c4seed1/global_step80108/layer_33-model_00-model_states.pt b/4b284b1b9c4seed1/global_step80108/layer_33-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cbd8b06d85435c6158d188e84ebf0ae496097e96 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/layer_33-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f9d4cf170185737552923e836ccf9c0001539d75528f747660370c16fc7b0c5a +size 113308931 diff --git a/4b284b1b9c4seed1/global_step80108/layer_33-model_01-model_states.pt b/4b284b1b9c4seed1/global_step80108/layer_33-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1b85eea7ed345e928fb6a39a844bd073cf1f164f --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/layer_33-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e07061dbc842fb06c4eb248e7e85c2a428064b012b83585c4ce5a653011360a +size 113308931 diff --git a/4b284b1b9c4seed1/global_step80108/layer_34-model_00-model_states.pt b/4b284b1b9c4seed1/global_step80108/layer_34-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0002ecaeceb438a6d0cb5a2c53d34cc34cacecc0 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/layer_34-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1c6e94d59524343e9c78b70f188d4dc4ae9521033216f9db2b5e6f6654e8f3c5 +size 113308931 diff --git a/4b284b1b9c4seed1/global_step80108/layer_34-model_01-model_states.pt b/4b284b1b9c4seed1/global_step80108/layer_34-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e10d6a51ffc67042ae590c3d75004a340a650fca --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/layer_34-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:beed5a12a975db56fab70a617b9dd02f2dbd956e083d755a9f45ccf92701437b +size 113308931 diff --git a/4b284b1b9c4seed1/global_step80108/layer_35-model_00-model_states.pt b/4b284b1b9c4seed1/global_step80108/layer_35-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..894160d665f23a689045ff2867064e49e524286a --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/layer_35-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76e18fd653a7a172fcc284f6953f58b7827f2e5eba8db5c6a10be81c2bb18e67 +size 113308931 diff --git a/4b284b1b9c4seed1/global_step80108/layer_35-model_01-model_states.pt b/4b284b1b9c4seed1/global_step80108/layer_35-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1d0aee2ec81d4ffe04a8107e0e4404131936835d --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/layer_35-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:77a9b07e7bab0121f3fc48b7b846ec294f328caa92fd8a1a235c24c5378adaeb +size 113308931 diff --git a/4b284b1b9c4seed1/global_step80108/layer_36-model_00-model_states.pt b/4b284b1b9c4seed1/global_step80108/layer_36-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..381b41b77cc69d883fddb9f56b84b9b830890ba5 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/layer_36-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:be56c50a3b824bd51238cc40be30460e8ae0aacf51c08a0e916a3600f0df393c +size 113308931 diff --git a/4b284b1b9c4seed1/global_step80108/layer_36-model_01-model_states.pt b/4b284b1b9c4seed1/global_step80108/layer_36-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a69638043afcab44eebaad8962a15f28700b17d2 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/layer_36-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ff0bf520c0cb28cb33eee30bbbf144145b3fcf5a666ed899424458aa8f78882b +size 113308931 diff --git a/4b284b1b9c4seed1/global_step80108/layer_37-model_00-model_states.pt b/4b284b1b9c4seed1/global_step80108/layer_37-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..55f7d49f04abc0ebf70b3af713d1c1d68a667a9d --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/layer_37-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3372ce778dafd42ce99600386826abc5c04f658d0e39badda18c2b99c3b441d7 +size 113308931 diff --git a/4b284b1b9c4seed1/global_step80108/layer_37-model_01-model_states.pt b/4b284b1b9c4seed1/global_step80108/layer_37-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9f0c47cdcb234f2bc94e60304ff2d08ba5deb1b9 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/layer_37-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:13701977e63fc0df6494ee348dea66cf83eb65e3cf2571da40295554914cda74 +size 113308931 diff --git a/4b284b1b9c4seed1/global_step80108/layer_38-model_00-model_states.pt b/4b284b1b9c4seed1/global_step80108/layer_38-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ccf1cb0e17228fcd1f08fe39c5ad5922e67c2787 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/layer_38-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b2a5d54ef207db218d31029b768428d94e9c389f4027a30341ff67b171e7157 +size 113308931 diff --git a/4b284b1b9c4seed1/global_step80108/layer_38-model_01-model_states.pt b/4b284b1b9c4seed1/global_step80108/layer_38-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9316621447bbaf41bf28ed2582ef0fc395ef9db1 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/layer_38-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5975bb21770928b0bd2da5a64f0b86faf4ef67aa16a2230cb3673d1c7f4dfda6 +size 113308931 diff --git a/4b284b1b9c4seed1/global_step80108/layer_40-model_00-model_states.pt b/4b284b1b9c4seed1/global_step80108/layer_40-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1859429e4f8d81f0ae7b93772182e3658699c5ae --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/layer_40-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:48034951867cb71cf62399bd69d674727e8d4f911e22e7015a82a27f062f16af +size 13507 diff --git a/4b284b1b9c4seed1/global_step80108/layer_40-model_01-model_states.pt b/4b284b1b9c4seed1/global_step80108/layer_40-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d22eb3c4bf1dc81558d835443114a052c466985b --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/layer_40-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ff0e0ec947bc06971027f7e94d8963cae5eb82493b348af93b6dd8493770688d +size 13507 diff --git a/4b284b1b9c4seed1/global_step80108/mp_rank_00_model_states.pt b/4b284b1b9c4seed1/global_step80108/mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6c4d9e804134a35397ce3bab06730dc2f7f80a62 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:67d0f23476f7a7393a89936770dc1d8d0a7a560c611a8311d8b1f5acecac3297 +size 51507 diff --git a/4b284b1b9c4seed1/global_step80108/mp_rank_01_model_states.pt b/4b284b1b9c4seed1/global_step80108/mp_rank_01_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f801974ac0331b87342a70a9e3c7310b28c81654 --- /dev/null +++ b/4b284b1b9c4seed1/global_step80108/mp_rank_01_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eee1819023de23179df0bfe579f74530a32fd0649456b1fdd0994529da7e1083 +size 51507 diff --git a/4b284b1b9c4seed1/transformers/config.json b/4b284b1b9c4seed1/transformers/config.json new file mode 100644 index 0000000000000000000000000000000000000000..df814c3a71ee49044410636b5eeb4f43611690ba --- /dev/null +++ b/4b284b1b9c4seed1/transformers/config.json @@ -0,0 +1 @@ +{"vocab_size": 50432, "n_positions": 2048, "n_embd": 3072, "n_layer": 36, "n_head": 24, "n_inner": 12288, "activation_function": "gelu", "resid_pdrop": 0.1, "embd_pdrop": 0.1, "attn_pdrop": 0.1, "layer_norm_epsilon": 1e-05, "initializer_range": 0.02, "summary_type": "cls_index", "summary_use_proj": true, "summary_activation": null, "summary_first_dropout": 0.1, "summary_proj_to_labels": true, "scale_attn_weights": true, "use_cache": true, "scale_attn_by_inverse_layer_idx": false, "reorder_and_upcast_attn": false, "bos_token_id": 50256, "eos_token_id": 50256, "return_dict": true, "output_hidden_states": false, "output_attentions": false, "torchscript": false, "torch_dtype": null, "use_bfloat16": false, "tf_legacy_loss": false, "pruned_heads": {}, "tie_word_embeddings": true, "is_encoder_decoder": false, "is_decoder": false, "cross_attention_hidden_size": null, "add_cross_attention": false, "tie_encoder_decoder": false, "max_length": 20, "min_length": 0, "do_sample": false, "early_stopping": false, "num_beams": 1, "num_beam_groups": 1, "diversity_penalty": 0.0, "temperature": 1.0, "top_k": 50, "top_p": 1.0, "typical_p": 1.0, "repetition_penalty": 1.0, "length_penalty": 1.0, "no_repeat_ngram_size": 0, "encoder_no_repeat_ngram_size": 0, "bad_words_ids": null, "num_return_sequences": 1, "chunk_size_feed_forward": 0, "output_scores": false, "return_dict_in_generate": false, "forced_bos_token_id": null, "forced_eos_token_id": null, "remove_invalid_values": false, "exponential_decay_length_penalty": null, "suppress_tokens": null, "begin_suppress_tokens": null, "architectures": ["GPT2LMHeadModel"], "finetuning_task": null, "id2label": {"0": "LABEL_0", "1": "LABEL_1"}, "label2id": {"LABEL_0": 0, "LABEL_1": 1}, "tokenizer_class": null, "prefix": null, "pad_token_id": null, "sep_token_id": null, "decoder_start_token_id": null, "task_specific_params": null, "problem_type": null, "_name_or_path": "", "transformers_version": "4.25.0.dev0", "n_ctx": 1024, "gradient_checkpointing": false, "model_type": "gpt2"} \ No newline at end of file diff --git a/4b284b1b9c4seed1/transformers/pytorch_model.bin b/4b284b1b9c4seed1/transformers/pytorch_model.bin new file mode 100644 index 0000000000000000000000000000000000000000..a4d8ae9f2225fd0274cae6c7f3a458c2e6f0fd74 --- /dev/null +++ b/4b284b1b9c4seed1/transformers/pytorch_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0c1cb53916bec317ba024bcba6cf8d2bf8f898764da06caa788378d8d1f8dd13 +size 8781203669 diff --git a/4b284b1b9c4seed2/evaluation/generation/agg.4b284b1b9c4seed2_GEM-web_nlg_en_PALM_prompt_0.json b/4b284b1b9c4seed2/evaluation/generation/agg.4b284b1b9c4seed2_GEM-web_nlg_en_PALM_prompt_0.json new file mode 100644 index 0000000000000000000000000000000000000000..6f34738406c99039d660718eaa0af56d4a3efefb --- /dev/null +++ b/4b284b1b9c4seed2/evaluation/generation/agg.4b284b1b9c4seed2_GEM-web_nlg_en_PALM_prompt_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.2736384503031292, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.013761131588040647}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.06743672908113135, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.002638252273936629}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.24234907953353363, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004536576899675782}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.0841242506256365, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0018270976968369269}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.027017029568202292, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0014828730907298778}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.10299041387162453, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0029846982659956075}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.03514871886969164, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0011146408262655305}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.06194176556417661, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.002469243942808823}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.2264836217634177, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.00433268038244018}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.07737030634527048, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0016531878395951427}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.06286672427102329, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.002521739438447608}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.22562189058095142, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004207794303094894}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.07803274538661605, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0016759567284788054}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b1b9c4seed2/evaluation/generation/agg.4b284b1b9c4seed2_GEM-web_nlg_en_PALM_prompt_1.json b/4b284b1b9c4seed2/evaluation/generation/agg.4b284b1b9c4seed2_GEM-web_nlg_en_PALM_prompt_1.json new file mode 100644 index 0000000000000000000000000000000000000000..5e5d84aa507b0d6185ebc76df7726aaa63f23c99 --- /dev/null +++ b/4b284b1b9c4seed2/evaluation/generation/agg.4b284b1b9c4seed2_GEM-web_nlg_en_PALM_prompt_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.3280132335844989, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.023397817639014704}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.0644491309312055, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.002168252601283438}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.26932324402478697, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004869448854108838}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.08616965529606423, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0017333332075431082}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.026688837851098213, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.00144137777314208}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.11232023057734815, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0031229809372560016}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.0348005109489672, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.001057061308651459}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.05835398948355422, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.002014413516440926}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.24510976411983082, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004441288545500777}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.07766746661115345, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0015488126211683285}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.05982295830374904, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0020397591398194034}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.24879869028857263, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004418589131657239}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.07959776724269638, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0015771133465866834}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b1b9c4seed2/evaluation/generation/agg.4b284b1b9c4seed2_GEM-web_nlg_en_PALM_prompt_2.json b/4b284b1b9c4seed2/evaluation/generation/agg.4b284b1b9c4seed2_GEM-web_nlg_en_PALM_prompt_2.json new file mode 100644 index 0000000000000000000000000000000000000000..2d8041772dae752dc6c47ddd39afd5e4995554a9 --- /dev/null +++ b/4b284b1b9c4seed2/evaluation/generation/agg.4b284b1b9c4seed2_GEM-web_nlg_en_PALM_prompt_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.34638515482577353, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.015291163912320053}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.06391106809448908, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0022299798579838675}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.27425504532607553, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004799759636672703}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.0880916672062598, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0018284068254863554}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.026175962829444736, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0013416093394333784}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.11550668310546741, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.003058036972217679}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.036072521136247385, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0011506150158658523}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.05713027372206721, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.001991481877156521}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.24716315799999466, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0043125243751206115}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.07881332955128942, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.001602085026744074}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.059367895890295445, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0020685069924175725}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.25477280658969237, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004397648802195207}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.08169534672440366, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0016715880286721457}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b1b9c4seed2/evaluation/generation/agg.4b284b1b9c4seed2_GEM-web_nlg_en_PALM_prompt_3.json b/4b284b1b9c4seed2/evaluation/generation/agg.4b284b1b9c4seed2_GEM-web_nlg_en_PALM_prompt_3.json new file mode 100644 index 0000000000000000000000000000000000000000..4243cbcdd95aacc56d17e165e4d0913751827a17 --- /dev/null +++ b/4b284b1b9c4seed2/evaluation/generation/agg.4b284b1b9c4seed2_GEM-web_nlg_en_PALM_prompt_3.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.3704624770003497, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.03638159942943428}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.05982634280444436, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0018001262758726789}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.2777138419634843, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004952916631808108}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.08559857536619786, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0016363130752602227}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.02360102097448928, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.000854243652157208}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.12042632696557598, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0032866446467497232}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.03505346120993315, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0010090465429173114}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.05383446823399059, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0017041071876981678}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.2500627435472675, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0044852293234451}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.07654509455251524, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0014639780726145254}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.055977403732155415, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0017529438408709402}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.25674832287427335, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.00451833760788113}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.07947542844329104, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0015233699868767465}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 3, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b1b9c4seed2/evaluation/generation/agg.4b284b1b9c4seed2_GEM-web_nlg_en_PALM_prompt_4.json b/4b284b1b9c4seed2/evaluation/generation/agg.4b284b1b9c4seed2_GEM-web_nlg_en_PALM_prompt_4.json new file mode 100644 index 0000000000000000000000000000000000000000..10a34054e51496680b52beee5739df32ab07246e --- /dev/null +++ b/4b284b1b9c4seed2/evaluation/generation/agg.4b284b1b9c4seed2_GEM-web_nlg_en_PALM_prompt_4.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.34948975698170615, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.023821938767836993}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.058510872569050076, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0014977652612347687}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.27839964342296464, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004925790540801674}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.08584051874793835, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0015622002417028488}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.023403315924946395, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0007924389946385025}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.12173985471099795, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.003270953240241298}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.03527561542480963, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0009617481477463297}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.052502534519531324, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0013726859531974134}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.24948504716127445, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004413042414587561}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.07682570075935022, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0013946187591393226}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.05451930264143289, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0014056245713133853}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.25804555072515556, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004485018866773874}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.079801865581312, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0014350152199570983}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 4, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b1b9c4seed2/evaluation/generation/agg.4b284b1b9c4seed2_GEM-web_nlg_en_PALM_prompt_5.json b/4b284b1b9c4seed2/evaluation/generation/agg.4b284b1b9c4seed2_GEM-web_nlg_en_PALM_prompt_5.json new file mode 100644 index 0000000000000000000000000000000000000000..6411e8253574fcd6a55f420c0676dd7296e5cd22 --- /dev/null +++ b/4b284b1b9c4seed2/evaluation/generation/agg.4b284b1b9c4seed2_GEM-web_nlg_en_PALM_prompt_5.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.3520654919870807, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.027609734870300613}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.06066641398573986, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0019391074427159668}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.27264418002989005, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004798703480922437}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.0854739749972663, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0016018030269853596}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.02575665330833014, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0013664015126702937}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.11728661099632723, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.003159030312730633}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.034951021231894634, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0009990590843116766}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.05442877601650985, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0018622354837109474}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.24215142547294755, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0042165672086959295}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.0757905577263458, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0014241979978356996}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.05680657817739951, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0018856743142604026}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.2521970662394448, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004360316207858167}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.07931691685317459, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.001477735740337954}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 5, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b1b9c4seed2/evaluation/generation/agg.4b284b1b9c4seed2_GEM-wiki_lingua_en_tldr_en_0.json b/4b284b1b9c4seed2/evaluation/generation/agg.4b284b1b9c4seed2_GEM-wiki_lingua_en_tldr_en_0.json new file mode 100644 index 0000000000000000000000000000000000000000..95eb151364241d232ff2fa2130794337b807f3bb --- /dev/null +++ b/4b284b1b9c4seed2/evaluation/generation/agg.4b284b1b9c4seed2_GEM-wiki_lingua_en_tldr_en_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.14402662945431702, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0019964636983908577}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.224835520834695, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.002534663076636594}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.15984310029967955, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0017964555443949755}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.024253651892450524, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0007830043238366567}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.03807915014193239, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0011514900025684483}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.026484542226918303, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0007149276960787613}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.1089736641128092, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0014490175204519933}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.1749701135473759, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0019676023959095718}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.12162866229386085, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0012526718135058654}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.1346760996841278, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0018704153662604697}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.21077414533420868, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0023879704709676495}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.14948770603973066, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.001676038166549879}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 1.1939811006947518, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.05144840709887267}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b1b9c4seed2/evaluation/generation/agg.4b284b1b9c4seed2_GEM-wiki_lingua_en_tldr_en_1.json b/4b284b1b9c4seed2/evaluation/generation/agg.4b284b1b9c4seed2_GEM-wiki_lingua_en_tldr_en_1.json new file mode 100644 index 0000000000000000000000000000000000000000..0828415ea76dfa68fb81018f569118070011f306 --- /dev/null +++ b/4b284b1b9c4seed2/evaluation/generation/agg.4b284b1b9c4seed2_GEM-wiki_lingua_en_tldr_en_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.1421779647141786, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.00183899601619}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.2328221252469704, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.002523117541816358}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.16323809480458262, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0017781665840047188}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.023068734244902384, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0006924316781711188}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.038394150548631906, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0012070561863604995}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.026405299879801242, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0007513499596621286}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.10407135199844923, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0012739274090963085}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.1756629066815182, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.001920166706499377}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.12039709037310402, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0012183558463707484}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.13389561548404935, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0017270516951590925}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.21986093946231267, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0023909852118580966}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.15379828585730648, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0016655511240505972}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 1.329387173898731, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.050959742820502744}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b1b9c4seed2/evaluation/generation/agg.4b284b1b9c4seed2_GEM-wiki_lingua_en_tldr_en_2.json b/4b284b1b9c4seed2/evaluation/generation/agg.4b284b1b9c4seed2_GEM-wiki_lingua_en_tldr_en_2.json new file mode 100644 index 0000000000000000000000000000000000000000..e8bfa24656ab8c60251ef30908948619258bef6b --- /dev/null +++ b/4b284b1b9c4seed2/evaluation/generation/agg.4b284b1b9c4seed2_GEM-wiki_lingua_en_tldr_en_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.1457832945742694, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0019709762483393995}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.23637305672174788, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.00247992475878217}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.16632065161606457, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0018066810527815245}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.025484778469339338, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0007890273465689312}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.04140023492730905, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0012184459681475824}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.028604389417761292, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0007628849403399381}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.10769050653186357, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0013738979743412702}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.1810403836066358, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0019346598459529787}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.1241823537201758, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0012458496339153408}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.1369600906660757, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0018450558019738083}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.22309275958929797, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.00234205408760469}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.15640138097648992, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0016797214333223785}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 1.4424517914266726, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.07020911999324617}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b1b9c4seed2/evaluation/generation/agg.4b284b1b9c4seed2_GEM-wiki_lingua_en_tldr_en_3.json b/4b284b1b9c4seed2/evaluation/generation/agg.4b284b1b9c4seed2_GEM-wiki_lingua_en_tldr_en_3.json new file mode 100644 index 0000000000000000000000000000000000000000..86ef63363fc2ef2acc91c35b881bd251288a9d86 --- /dev/null +++ b/4b284b1b9c4seed2/evaluation/generation/agg.4b284b1b9c4seed2_GEM-wiki_lingua_en_tldr_en_3.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.12998655695663616, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.002189516833129907}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.20496486516154497, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0028659172041743037}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.143979322470228, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0020322874462190108}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.02321033760008198, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0007517668617932092}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.03739800165990479, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0012436961876240002}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.025681636061568994, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0007575885700225844}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.09639136628498862, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0015654498649897994}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.15704796853631195, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002245229184123941}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.10744111532164179, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0014289232021387648}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.12253923603559544, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0020589899658542553}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.19382819078757685, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0027171877182869237}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.13580783797212667, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0019069485763797925}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 1.6327965384480934, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.04784558757070599}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 3, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b1b9c4seed2/evaluation/generation/agg.4b284b1b9c4seed2_GEM-wiki_lingua_en_tldr_en_4.json b/4b284b1b9c4seed2/evaluation/generation/agg.4b284b1b9c4seed2_GEM-wiki_lingua_en_tldr_en_4.json new file mode 100644 index 0000000000000000000000000000000000000000..48ca38b7ed3d18027a1b5916d6885bb4b14d7444 --- /dev/null +++ b/4b284b1b9c4seed2/evaluation/generation/agg.4b284b1b9c4seed2_GEM-wiki_lingua_en_tldr_en_4.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.046448930876018805, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0018035348802430623}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.07357293605788026, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0025697179083559174}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.04993869263777386, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0017400482796179053}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.009115547013068444, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0007080420784229646}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.014379490534632422, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0008642671865072303}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.009405169337583598, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0005257744049594801}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.03565948935943829, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0013979177010115587}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.057422168791446994, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0020177366914654244}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.038166867834712785, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0012986554235132886}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.04362589861222556, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0016994783987957273}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.06935466728288939, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.002427541920224267}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.0469149420555244, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0016335234715811244}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 0.3975830375151671, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.03517002110590927}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 4, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b1b9c4seed2/evaluation/generation/agg.4b284b1b9c4seed2_GEM-wiki_lingua_en_tldr_en_5.json b/4b284b1b9c4seed2/evaluation/generation/agg.4b284b1b9c4seed2_GEM-wiki_lingua_en_tldr_en_5.json new file mode 100644 index 0000000000000000000000000000000000000000..d0bbf407fdd775db87416b536854e2ce5cc55923 --- /dev/null +++ b/4b284b1b9c4seed2/evaluation/generation/agg.4b284b1b9c4seed2_GEM-wiki_lingua_en_tldr_en_5.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.007172892267383475, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0007917929568286087}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.011671122997395015, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0011606516791878689}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.007568370913695297, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0007491159620591852}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.001264178384729475, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0001966473650926985}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.0024796221258986603, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0004192114120392164}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.0013965027873250944, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.00020572985862442358}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.005490417768289501, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0005849801172714558}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.009413328535258628, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0009398460308935353}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.005865552021821947, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0005564517319441601}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.006712756393605032, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0007345666949798625}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.010998399946717396, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0010932046581100556}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.007131866271390784, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0007049678056309991}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 6.239939007315392e-07, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 9.71466408645211e-07}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 5, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b1b9c4seed2/evaluation/generation/agg.4b284b1b9c4seed2_e2e_nlg_cleaned_generate_text_restaurant_0.json b/4b284b1b9c4seed2/evaluation/generation/agg.4b284b1b9c4seed2_e2e_nlg_cleaned_generate_text_restaurant_0.json new file mode 100644 index 0000000000000000000000000000000000000000..bea980625f72fd4e25efdb6dcc19513600f6d0cc --- /dev/null +++ b/4b284b1b9c4seed2/evaluation/generation/agg.4b284b1b9c4seed2_e2e_nlg_cleaned_generate_text_restaurant_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 0.9812514400249457, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.05562262752722095}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.15847815457785414, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.004328803941964481}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.12742700108402852, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0023559640853185737}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.10900954926081764, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0020004132814706306}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.07159611132449242, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0037286287454660018}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.028548308692682663, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0008068071456433969}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.027201662156796255, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.000788791139157471}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.1334388407711523, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.003974193073139387}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.10337061722487395, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0018911584688758604}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.08788250933957609, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0015590214437749034}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.14150177498276953, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.004129595856079377}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.10875548432324901, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.002033382683937447}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.09356044304033936, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.001722161996359038}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b1b9c4seed2/evaluation/generation/agg.4b284b1b9c4seed2_e2e_nlg_cleaned_generate_text_restaurant_1.json b/4b284b1b9c4seed2/evaluation/generation/agg.4b284b1b9c4seed2_e2e_nlg_cleaned_generate_text_restaurant_1.json new file mode 100644 index 0000000000000000000000000000000000000000..898d2bfb7901182b5869b06cceff2541d17586a8 --- /dev/null +++ b/4b284b1b9c4seed2/evaluation/generation/agg.4b284b1b9c4seed2_e2e_nlg_cleaned_generate_text_restaurant_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 5.2253192440366405, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.07140167205007719}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.3815177071515503, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.005218371241177884}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.3106318538579719, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0031963478818675803}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.26325944037191484, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0022748072352886776}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.20178279286083556, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.005294112759514037}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.11654879964306347, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.001824032288290023}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.10002146341400579, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0014693572942374512}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.324114703856428, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.005097258650525136}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.2500017558247758, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0025922878822160645}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.2113652311205057, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0017419352055642414}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.3390145444380815, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.005172645689386997}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.26174975224096514, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.002787496997673839}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.22354194196380525, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0019987653462617975}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b1b9c4seed2/evaluation/generation/agg.4b284b1b9c4seed2_e2e_nlg_cleaned_generate_text_restaurant_2.json b/4b284b1b9c4seed2/evaluation/generation/agg.4b284b1b9c4seed2_e2e_nlg_cleaned_generate_text_restaurant_2.json new file mode 100644 index 0000000000000000000000000000000000000000..cabfe498131ee5705c8245c21363dbab6e999a20 --- /dev/null +++ b/4b284b1b9c4seed2/evaluation/generation/agg.4b284b1b9c4seed2_e2e_nlg_cleaned_generate_text_restaurant_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 5.968462167589187, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.0809413455934123}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.37561041209802154, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.004803576540487985}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.34542246645230873, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0028469806255225247}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.29114774014783334, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0021518045305416187}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.18697031703703257, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.004365267354030048}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.13946536473639037, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0018038930024966585}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.11837013500076157, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0014809679532815788}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.315951536990457, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.004519636510616847}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.2848990694431196, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0024528350275542597}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.2378485997813391, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0017083954437583943}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.32795875851147216, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.004687306327421472}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.29047623226002345, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0025636131138164543}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.24624266553405377, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.001958228700135443}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b1b9c4seed2/evaluation/generation/agg.4b284b1b9c4seed2_e2e_nlg_cleaned_generate_text_restaurant_3.json b/4b284b1b9c4seed2/evaluation/generation/agg.4b284b1b9c4seed2_e2e_nlg_cleaned_generate_text_restaurant_3.json new file mode 100644 index 0000000000000000000000000000000000000000..ffc0352d7aa0db57838183e5d19da3f4549741a6 --- /dev/null +++ b/4b284b1b9c4seed2/evaluation/generation/agg.4b284b1b9c4seed2_e2e_nlg_cleaned_generate_text_restaurant_3.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 6.100413535925033, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.10204084214961892}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.35577144203191385, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.004537003722998761}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.3647244934358361, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.002747523679173933}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.29715275676346536, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0020593689131373845}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.17035987156923135, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0038407536951717567}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.15028814529506035, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0018136946483250282}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.12236707177425063, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.001437321932186944}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.29603811661828844, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.004152196775629119}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.3006722948935132, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0023586910132368166}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.24251170955511187, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0016065436945657693}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.30701171887463186, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0043364855185944965}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.30602796565632656, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0024654434831691296}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.2502378170722232, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0018582144974208202}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 3, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b1b9c4seed2/evaluation/generation/agg.4b284b1b9c4seed2_e2e_nlg_cleaned_generate_text_restaurant_4.json b/4b284b1b9c4seed2/evaluation/generation/agg.4b284b1b9c4seed2_e2e_nlg_cleaned_generate_text_restaurant_4.json new file mode 100644 index 0000000000000000000000000000000000000000..4ecf19ee5ea12fafff7546d79bb3b5515aeec68e --- /dev/null +++ b/4b284b1b9c4seed2/evaluation/generation/agg.4b284b1b9c4seed2_e2e_nlg_cleaned_generate_text_restaurant_4.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 6.302528506929725, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.09159160557761398}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.3457184925802193, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.004160231582604038}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.38873799656965313, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.002639030454229803}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.3106389862425593, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0019745864967604964}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.1613981344463189, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0034319902981585207}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.16100746129847524, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0017978172805353685}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.12862161964342028, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.001433312603510002}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.28411370893647675, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.003743798776985757}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.319390176337282, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0023152107019332466}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.25227586868839813, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.001559219635105758}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.2963124375137464, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.003972319515480073}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.32622007058557423, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.002450252978851981}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.26125127654019925, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0018446022776906345}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 4, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b1b9c4seed2/evaluation/generation/agg.4b284b1b9c4seed2_e2e_nlg_cleaned_generate_text_restaurant_5.json b/4b284b1b9c4seed2/evaluation/generation/agg.4b284b1b9c4seed2_e2e_nlg_cleaned_generate_text_restaurant_5.json new file mode 100644 index 0000000000000000000000000000000000000000..63d67d1c1556cf8078c1a5862e6318c29e62c156 --- /dev/null +++ b/4b284b1b9c4seed2/evaluation/generation/agg.4b284b1b9c4seed2_e2e_nlg_cleaned_generate_text_restaurant_5.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 6.2420502388251435, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.11069521906199865}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.31078931466957455, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0035821838565772805}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.40928814978401035, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.002513611780694676}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.31044786268293756, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.001944681263041426}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.13661422794726982, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.00268531843352623}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.17131478141957424, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.001846264774766135}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.12861734204623188, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0014302618265553057}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.2514460944139299, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0030526186239578533}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.3356791583944898, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002240539567274668}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.2510224592044638, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0015295416689170924}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.26462055977448007, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.003336730030918389}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.3452406840839544, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0023886668900561766}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.2617560668553504, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.001820974367559263}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 5, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b1b9c4seed2/evaluation/generation/agg.4b284b1b9c4seed2_gem_xsum_article_DOC_summary_0.json b/4b284b1b9c4seed2/evaluation/generation/agg.4b284b1b9c4seed2_gem_xsum_article_DOC_summary_0.json new file mode 100644 index 0000000000000000000000000000000000000000..f0103155235036ddf6a7f40bbac437e9527b36d0 --- /dev/null +++ b/4b284b1b9c4seed2/evaluation/generation/agg.4b284b1b9c4seed2_gem_xsum_article_DOC_summary_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.16316619187689388, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.002890984890147137}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.31001559634568143, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.003978659821378838}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.20008656508370964, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002602919942357546}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.03352547525672803, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0014320698536196147}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.06430340976455366, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.00231938341604023}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.04090748442736069, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0014928104681925642}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.12270675062564947, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0022927482127938856}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.2338821411106156, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0031011088285461284}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.1502142949913443, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0020028080134693966}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.12803202942224567, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.002326732638749928}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.24656433036848785, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.003410843786433149}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.15761386746032657, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0021239498717418375}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 1.4539286316534636, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.10413341300371938}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b1b9c4seed2/evaluation/generation/agg.4b284b1b9c4seed2_gem_xsum_article_DOC_summary_1.json b/4b284b1b9c4seed2/evaluation/generation/agg.4b284b1b9c4seed2_gem_xsum_article_DOC_summary_1.json new file mode 100644 index 0000000000000000000000000000000000000000..1df4ae3b85aab641c4b879b916cba3fb4196e6ee --- /dev/null +++ b/4b284b1b9c4seed2/evaluation/generation/agg.4b284b1b9c4seed2_gem_xsum_article_DOC_summary_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.11453236899619632, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0016195986503994135}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.2802645254992808, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.003696829148468212}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.16026754839725937, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002152722052964271}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.01742972704474614, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0008103528180574307}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.04404260214452908, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0020813739232181275}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.024638353865890434, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0011382421012757812}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.08816027894258283, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0012193640200953474}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.21709258927943814, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002827223535684834}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.12352821757343255, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0016133160942209523}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.0920451713692867, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0013155981196239118}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.2271186416361983, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.003132670977496884}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.12904870256695447, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0017598213737764256}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 0.9965190176386574, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.05559453420420461}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b1b9c4seed2/evaluation/generation/agg.4b284b1b9c4seed2_gem_xsum_article_DOC_summary_2.json b/4b284b1b9c4seed2/evaluation/generation/agg.4b284b1b9c4seed2_gem_xsum_article_DOC_summary_2.json new file mode 100644 index 0000000000000000000000000000000000000000..89fe0949f42bceb0c7ca9b85b5a109c1d2074bd7 --- /dev/null +++ b/4b284b1b9c4seed2/evaluation/generation/agg.4b284b1b9c4seed2_gem_xsum_article_DOC_summary_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.11145983804593526, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0014743643800890196}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.28045679367482057, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0034259770552426184}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.15769070631922, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.001982981910213691}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.015152005516530816, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0006754060180232467}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.039166379272577614, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0017988727907617531}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.021605793985650032, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0009634567881537258}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.08486603983815774, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.001085791049406374}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.21516366945216606, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0026703236853124913}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.12029157280634108, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.001476371836829727}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.0901270375976316, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0012216984674086196}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.2285463112828528, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.002980474602095322}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.12777306089054677, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0016653146013723525}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 0.8252686451228434, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.06219441463160752}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b1b9c4seed2/evaluation/generation/agg.4b284b1b9c4seed2_gem_xsum_article_DOC_summary_3.json b/4b284b1b9c4seed2/evaluation/generation/agg.4b284b1b9c4seed2_gem_xsum_article_DOC_summary_3.json new file mode 100644 index 0000000000000000000000000000000000000000..a4d1a2c124247743b9cf80b79481c9824a4c2a7e --- /dev/null +++ b/4b284b1b9c4seed2/evaluation/generation/agg.4b284b1b9c4seed2_gem_xsum_article_DOC_summary_3.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.1078263305297306, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0017542085299995392}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.2580253690370548, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0037660524996162735}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.14870537856013735, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0022250373297856207}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.014571709458807564, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0007101227457714503}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.03574556425775684, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0017388222484751564}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.020403012896272645, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0009871637156077466}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.08197966655283043, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.001292307383970243}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.1974050382443013, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0028035058486686956}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.11315310318316395, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0016139643872092233}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.08677115079741256, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.001375140243984192}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.20995584785478394, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0031091921366029267}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.12007749682129613, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0017680042779764178}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 0.8113683570520359, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.06619825265722147}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 3, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b1b9c4seed2/evaluation/generation/agg.4b284b1b9c4seed2_gem_xsum_article_DOC_summary_4.json b/4b284b1b9c4seed2/evaluation/generation/agg.4b284b1b9c4seed2_gem_xsum_article_DOC_summary_4.json new file mode 100644 index 0000000000000000000000000000000000000000..e8f93c24398a80a314c53d2c90164b90e8b8e7af --- /dev/null +++ b/4b284b1b9c4seed2/evaluation/generation/agg.4b284b1b9c4seed2_gem_xsum_article_DOC_summary_4.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.03418472303276383, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.00210110351555125}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.06304793651249774, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0035973524455498603}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.04010781297274983, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0022481684730005936}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.004145873623694822, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0005061006325311766}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.008843875903750643, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0010081977796634128}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.00536187053653973, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0006114168649663856}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.027278513716520444, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0017455746766801424}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.04970336071033803, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002848378744916723}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.03144663530333203, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0017459513025573287}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.02813790632578131, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0018032712966730017}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.05107839677205752, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0029256027588574272}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.03239030933843817, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0018053015484972615}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 0.4568380418312376, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.11240957017003458}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 4, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b1b9c4seed2/evaluation/generation/agg.4b284b1b9c4seed2_gem_xsum_article_DOC_summary_5.json b/4b284b1b9c4seed2/evaluation/generation/agg.4b284b1b9c4seed2_gem_xsum_article_DOC_summary_5.json new file mode 100644 index 0000000000000000000000000000000000000000..220a2d93aa0a081e695d73ddcb8f517c658ac25f --- /dev/null +++ b/4b284b1b9c4seed2/evaluation/generation/agg.4b284b1b9c4seed2_gem_xsum_article_DOC_summary_5.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.0019374196381469005, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0005297555109388115}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.0017199042758875617, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0004699087955021987}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.0017758047725847756, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0004794001433637215}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.0, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.0, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.0, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.0016417177155976152, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0004455222998055521}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.0014066712761193988, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0003697747285853825}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.0014811178551071952, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.00039295568397820974}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.0017493422405362358, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0004643643474163307}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.0015674774510765171, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.00042362427764150467}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.0016076723854203951, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0004229539683443897}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 1.2435863834999107e-38, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 1.6010999120135594e-32}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 5, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b1b9c4seed2/evaluation/generation/examples.4b284b1b9c4seed2_GEM-web_nlg_en_PALM_prompt_0.jsonl b/4b284b1b9c4seed2/evaluation/generation/examples.4b284b1b9c4seed2_GEM-web_nlg_en_PALM_prompt_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..388ce79798555196c67f2b17f82d5ce57a9229e7 --- /dev/null +++ b/4b284b1b9c4seed2/evaluation/generation/examples.4b284b1b9c4seed2_GEM-web_nlg_en_PALM_prompt_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f0e899a0210b6e2a0caae3ab8176962320542ec41b175f43df82bc5ead8827dd +size 4032442 diff --git a/4b284b1b9c4seed2/evaluation/generation/examples.4b284b1b9c4seed2_GEM-web_nlg_en_PALM_prompt_1.jsonl b/4b284b1b9c4seed2/evaluation/generation/examples.4b284b1b9c4seed2_GEM-web_nlg_en_PALM_prompt_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..c74e59f8be8a35663029933c08cd898ce340860f --- /dev/null +++ b/4b284b1b9c4seed2/evaluation/generation/examples.4b284b1b9c4seed2_GEM-web_nlg_en_PALM_prompt_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d80f891160d93b34485acf2716c3d3a4a84b007666d21a325bed51cd57a06987 +size 5021691 diff --git a/4b284b1b9c4seed2/evaluation/generation/examples.4b284b1b9c4seed2_GEM-web_nlg_en_PALM_prompt_2.jsonl b/4b284b1b9c4seed2/evaluation/generation/examples.4b284b1b9c4seed2_GEM-web_nlg_en_PALM_prompt_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..25c4344f4072468d4936458189657fa2280e22ea --- /dev/null +++ b/4b284b1b9c4seed2/evaluation/generation/examples.4b284b1b9c4seed2_GEM-web_nlg_en_PALM_prompt_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a6a5d1b2e02be79a31f73dd6287386820dea4a501aef989e1e099a84e35ca81b +size 5957618 diff --git a/4b284b1b9c4seed2/evaluation/generation/examples.4b284b1b9c4seed2_GEM-web_nlg_en_PALM_prompt_3.jsonl b/4b284b1b9c4seed2/evaluation/generation/examples.4b284b1b9c4seed2_GEM-web_nlg_en_PALM_prompt_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..6e03999cf201316f952a88a0421608b0d6d4af04 --- /dev/null +++ b/4b284b1b9c4seed2/evaluation/generation/examples.4b284b1b9c4seed2_GEM-web_nlg_en_PALM_prompt_3.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eb4cafdf1805bb4a79cbd53878fa7c0481465bd70e1a96b8d394b03b2000e92b +size 6859836 diff --git a/4b284b1b9c4seed2/evaluation/generation/examples.4b284b1b9c4seed2_GEM-web_nlg_en_PALM_prompt_4.jsonl b/4b284b1b9c4seed2/evaluation/generation/examples.4b284b1b9c4seed2_GEM-web_nlg_en_PALM_prompt_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..f8233bdbd2e7bcf721621de602da46945fbbe9fd --- /dev/null +++ b/4b284b1b9c4seed2/evaluation/generation/examples.4b284b1b9c4seed2_GEM-web_nlg_en_PALM_prompt_4.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4ce85c0b0a221ba7f80d8cad060ef10c143cd8fe19050bcbae6a7ac4a0be5119 +size 7770014 diff --git a/4b284b1b9c4seed2/evaluation/generation/examples.4b284b1b9c4seed2_GEM-web_nlg_en_PALM_prompt_5.jsonl b/4b284b1b9c4seed2/evaluation/generation/examples.4b284b1b9c4seed2_GEM-web_nlg_en_PALM_prompt_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..c981575d06e549b3ef9f55023ba5eb143f89bc48 --- /dev/null +++ b/4b284b1b9c4seed2/evaluation/generation/examples.4b284b1b9c4seed2_GEM-web_nlg_en_PALM_prompt_5.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c69ef5a07ae415483e6721671ffa8fa1fd270930d41096d23ed7d13269c6915f +size 8674356 diff --git a/4b284b1b9c4seed2/evaluation/generation/examples.4b284b1b9c4seed2_GEM-wiki_lingua_en_tldr_en_0.jsonl b/4b284b1b9c4seed2/evaluation/generation/examples.4b284b1b9c4seed2_GEM-wiki_lingua_en_tldr_en_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..57524b51d917a091d3625f04ae1bfab654ccb920 --- /dev/null +++ b/4b284b1b9c4seed2/evaluation/generation/examples.4b284b1b9c4seed2_GEM-wiki_lingua_en_tldr_en_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:881c8a34c1b9fcb270593423ddfe030badfb370bd9d112c93d917692ab5af34f +size 7660507 diff --git a/4b284b1b9c4seed2/evaluation/generation/examples.4b284b1b9c4seed2_GEM-wiki_lingua_en_tldr_en_1.jsonl b/4b284b1b9c4seed2/evaluation/generation/examples.4b284b1b9c4seed2_GEM-wiki_lingua_en_tldr_en_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..b61a5c9f8c931f97097711428322aded1d2f8d09 --- /dev/null +++ b/4b284b1b9c4seed2/evaluation/generation/examples.4b284b1b9c4seed2_GEM-wiki_lingua_en_tldr_en_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:96c400ae74b8d418d1b508bfc04ac787d351b41167ad6d3a3ea7d40d32b17428 +size 13310523 diff --git a/4b284b1b9c4seed2/evaluation/generation/examples.4b284b1b9c4seed2_GEM-wiki_lingua_en_tldr_en_2.jsonl b/4b284b1b9c4seed2/evaluation/generation/examples.4b284b1b9c4seed2_GEM-wiki_lingua_en_tldr_en_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..aaa274aae8cdb8353248e7baf8553d83b2bf11e7 --- /dev/null +++ b/4b284b1b9c4seed2/evaluation/generation/examples.4b284b1b9c4seed2_GEM-wiki_lingua_en_tldr_en_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:53ec5160830fb6aeeae55b7d24df4a3f9a5289deb9d17eea94fdd976cb423013 +size 18910553 diff --git a/4b284b1b9c4seed2/evaluation/generation/examples.4b284b1b9c4seed2_GEM-wiki_lingua_en_tldr_en_3.jsonl b/4b284b1b9c4seed2/evaluation/generation/examples.4b284b1b9c4seed2_GEM-wiki_lingua_en_tldr_en_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..3d91edded36973b86163b4bd03fcfd4326aecd1c --- /dev/null +++ b/4b284b1b9c4seed2/evaluation/generation/examples.4b284b1b9c4seed2_GEM-wiki_lingua_en_tldr_en_3.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0fe822fc96c8fcfd390b5801ada309bbbb0b16f0f36f7494247128c9099e596c +size 24338760 diff --git a/4b284b1b9c4seed2/evaluation/generation/examples.4b284b1b9c4seed2_GEM-wiki_lingua_en_tldr_en_4.jsonl b/4b284b1b9c4seed2/evaluation/generation/examples.4b284b1b9c4seed2_GEM-wiki_lingua_en_tldr_en_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..6d7c473b551eadba97abd7cf312cb8fd4241fbbe --- /dev/null +++ b/4b284b1b9c4seed2/evaluation/generation/examples.4b284b1b9c4seed2_GEM-wiki_lingua_en_tldr_en_4.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c6ca27d810ce82a14c38df5b1685698c1cde41980b483eae7464ce33d57f153d +size 29477451 diff --git a/4b284b1b9c4seed2/evaluation/generation/examples.4b284b1b9c4seed2_GEM-wiki_lingua_en_tldr_en_5.jsonl b/4b284b1b9c4seed2/evaluation/generation/examples.4b284b1b9c4seed2_GEM-wiki_lingua_en_tldr_en_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..700c43e840aa2d7abae211bf2fc9d498b568d684 --- /dev/null +++ b/4b284b1b9c4seed2/evaluation/generation/examples.4b284b1b9c4seed2_GEM-wiki_lingua_en_tldr_en_5.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8539672ae0075d916165c6741a27548970549302a0b43546251f9b11fc1988b9 +size 34800937 diff --git a/4b284b1b9c4seed2/evaluation/generation/examples.4b284b1b9c4seed2_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl b/4b284b1b9c4seed2/evaluation/generation/examples.4b284b1b9c4seed2_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..21f53fd7b3c0edf76f71f0039394936519928a01 --- /dev/null +++ b/4b284b1b9c4seed2/evaluation/generation/examples.4b284b1b9c4seed2_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bf22c38d4c74e78366451c7aca03ccf208ea105050e320283ee5ef16660b6a3f +size 3957522 diff --git a/4b284b1b9c4seed2/evaluation/generation/examples.4b284b1b9c4seed2_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl b/4b284b1b9c4seed2/evaluation/generation/examples.4b284b1b9c4seed2_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..23fe4c9300d487e48c4f04e2ede318a2746c9a8f --- /dev/null +++ b/4b284b1b9c4seed2/evaluation/generation/examples.4b284b1b9c4seed2_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e52db72bc4ce785c5a85ca852af71ed463b194dfdf3f6c8792954f7e72b1b401 +size 5195642 diff --git a/4b284b1b9c4seed2/evaluation/generation/examples.4b284b1b9c4seed2_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl b/4b284b1b9c4seed2/evaluation/generation/examples.4b284b1b9c4seed2_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..1fb8d406fe9ec27da19ded7320765def0ff6c94a --- /dev/null +++ b/4b284b1b9c4seed2/evaluation/generation/examples.4b284b1b9c4seed2_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8aa35369f2ae13019bb9f74ae16458ac34c3a33db03495963408960deebf3dc0 +size 6317946 diff --git a/4b284b1b9c4seed2/evaluation/generation/examples.4b284b1b9c4seed2_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl b/4b284b1b9c4seed2/evaluation/generation/examples.4b284b1b9c4seed2_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..52455482bf853c8dae2f5367bfc4ecb67801c38f --- /dev/null +++ b/4b284b1b9c4seed2/evaluation/generation/examples.4b284b1b9c4seed2_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea32b62a356376e17e7eda001a79ef02438fdb779f44c67a53d836ba04e04e89 +size 7436612 diff --git a/4b284b1b9c4seed2/evaluation/generation/examples.4b284b1b9c4seed2_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl b/4b284b1b9c4seed2/evaluation/generation/examples.4b284b1b9c4seed2_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..552d0bac7fc68c69ac3b4a258208f197e90db305 --- /dev/null +++ b/4b284b1b9c4seed2/evaluation/generation/examples.4b284b1b9c4seed2_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d7508d00daf676ce31c8874ac20d5def188e52ef86bffe3bb477fa620de89827 +size 8540750 diff --git a/4b284b1b9c4seed2/evaluation/generation/examples.4b284b1b9c4seed2_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl b/4b284b1b9c4seed2/evaluation/generation/examples.4b284b1b9c4seed2_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..dc393af6c308627a55dffbc70706c5a2e9b86822 --- /dev/null +++ b/4b284b1b9c4seed2/evaluation/generation/examples.4b284b1b9c4seed2_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7428a541f3f8e8aa9dd8e944aebbca29eb6e6ee78be99cf4a63fc272803b7f1b +size 9679349 diff --git a/4b284b1b9c4seed2/evaluation/generation/examples.4b284b1b9c4seed2_gem_xsum_article_DOC_summary_0.jsonl b/4b284b1b9c4seed2/evaluation/generation/examples.4b284b1b9c4seed2_gem_xsum_article_DOC_summary_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..b55c3e7c6ddc62bc8e0fca845d6532309d862fb6 --- /dev/null +++ b/4b284b1b9c4seed2/evaluation/generation/examples.4b284b1b9c4seed2_gem_xsum_article_DOC_summary_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:66a0414e3aeae9bc6d278b3e0678aaf3c7a1fedb14471d43e9b8ae4b5aceef13 +size 2790347 diff --git a/4b284b1b9c4seed2/evaluation/generation/examples.4b284b1b9c4seed2_gem_xsum_article_DOC_summary_1.jsonl b/4b284b1b9c4seed2/evaluation/generation/examples.4b284b1b9c4seed2_gem_xsum_article_DOC_summary_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..e77ec46c3204a3e0a22a74e96964a7909866c2fb --- /dev/null +++ b/4b284b1b9c4seed2/evaluation/generation/examples.4b284b1b9c4seed2_gem_xsum_article_DOC_summary_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:854ebc8dd7ebd23afbbcf7c712ffd5e7fad6818ba47a7ee61284853c8a1cffef +size 5101680 diff --git a/4b284b1b9c4seed2/evaluation/generation/examples.4b284b1b9c4seed2_gem_xsum_article_DOC_summary_2.jsonl b/4b284b1b9c4seed2/evaluation/generation/examples.4b284b1b9c4seed2_gem_xsum_article_DOC_summary_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..c7b6c0a9b404ab96304ff4f8570726f84a2f0d67 --- /dev/null +++ b/4b284b1b9c4seed2/evaluation/generation/examples.4b284b1b9c4seed2_gem_xsum_article_DOC_summary_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f3b7fcabc44b3ece5646d0fff6c745840bfd0fa7905305cc4040bf38e1c507e8 +size 7384348 diff --git a/4b284b1b9c4seed2/evaluation/generation/examples.4b284b1b9c4seed2_gem_xsum_article_DOC_summary_3.jsonl b/4b284b1b9c4seed2/evaluation/generation/examples.4b284b1b9c4seed2_gem_xsum_article_DOC_summary_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..7a8d6ed8dfef63dcbf075ee97a074603d7d35b6f --- /dev/null +++ b/4b284b1b9c4seed2/evaluation/generation/examples.4b284b1b9c4seed2_gem_xsum_article_DOC_summary_3.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2e6ae3a4d2fb7fe982c32ff68d46f0427b368b71a1bc359152a09ddc757f3c0a +size 9652523 diff --git a/4b284b1b9c4seed2/evaluation/generation/examples.4b284b1b9c4seed2_gem_xsum_article_DOC_summary_4.jsonl b/4b284b1b9c4seed2/evaluation/generation/examples.4b284b1b9c4seed2_gem_xsum_article_DOC_summary_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..b651ad95912bceda588f6a82849907988c587476 --- /dev/null +++ b/4b284b1b9c4seed2/evaluation/generation/examples.4b284b1b9c4seed2_gem_xsum_article_DOC_summary_4.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fb562da09f66394dd6ff0396ca2da3eeabd69b7e219693af54387b2be249fbbf +size 11674534 diff --git a/4b284b1b9c4seed2/evaluation/generation/examples.4b284b1b9c4seed2_gem_xsum_article_DOC_summary_5.jsonl b/4b284b1b9c4seed2/evaluation/generation/examples.4b284b1b9c4seed2_gem_xsum_article_DOC_summary_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..d9d6b971b957fadfa96904c02817e27251d0dcfc --- /dev/null +++ b/4b284b1b9c4seed2/evaluation/generation/examples.4b284b1b9c4seed2_gem_xsum_article_DOC_summary_5.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:be311f7df56420ecda246b0c0f7515552baa7cb0b2d90ffb8bd165a33ef7a4b0 +size 13897575 diff --git a/4b284b1b9c4seed2/evaluation/generation/merged.csv b/4b284b1b9c4seed2/evaluation/generation/merged.csv new file mode 100644 index 0000000000000000000000000000000000000000..8b59748dac37f92281483a2324d5e16de9e521e1 --- /dev/null +++ b/4b284b1b9c4seed2/evaluation/generation/merged.csv @@ -0,0 +1,53 @@ +dataset,fewshots,prompt,metric,value +e2e_nlg_cleaned,0,generate_text_restaurant,rouge2_fmeasure,0.027201662156796255 +e2e_nlg_cleaned,0,median,rouge2_fmeasure,0.027201662156796255 +e2e_nlg_cleaned,1,generate_text_restaurant,rouge2_fmeasure,0.10002146341400579 +e2e_nlg_cleaned,1,median,rouge2_fmeasure,0.10002146341400579 +e2e_nlg_cleaned,2,generate_text_restaurant,rouge2_fmeasure,0.11837013500076157 +e2e_nlg_cleaned,2,median,rouge2_fmeasure,0.11837013500076157 +e2e_nlg_cleaned,3,generate_text_restaurant,rouge2_fmeasure,0.12236707177425063 +e2e_nlg_cleaned,3,median,rouge2_fmeasure,0.12236707177425063 +e2e_nlg_cleaned,4,generate_text_restaurant,rouge2_fmeasure,0.12862161964342028 +e2e_nlg_cleaned,4,median,rouge2_fmeasure,0.12862161964342028 +e2e_nlg_cleaned,5,generate_text_restaurant,rouge2_fmeasure,0.12861734204623188 +e2e_nlg_cleaned,5,median,rouge2_fmeasure,0.12861734204623188 +e2e_nlg_cleaned,5,average,multiple,0.1041998823392444 +gem_xsum,0,article_DOC_summary,rouge2_fmeasure,0.04090748442736069 +gem_xsum,0,median,rouge2_fmeasure,0.04090748442736069 +gem_xsum,1,article_DOC_summary,rouge2_fmeasure,0.024638353865890434 +gem_xsum,1,median,rouge2_fmeasure,0.024638353865890434 +gem_xsum,2,article_DOC_summary,rouge2_fmeasure,0.021605793985650032 +gem_xsum,2,median,rouge2_fmeasure,0.021605793985650032 +gem_xsum,3,article_DOC_summary,rouge2_fmeasure,0.020403012896272645 +gem_xsum,3,median,rouge2_fmeasure,0.020403012896272645 +gem_xsum,4,article_DOC_summary,rouge2_fmeasure,0.00536187053653973 +gem_xsum,4,median,rouge2_fmeasure,0.00536187053653973 +gem_xsum,5,article_DOC_summary,rouge2_fmeasure,0.0 +gem_xsum,5,median,rouge2_fmeasure,0.0 +gem_xsum,5,average,multiple,0.018819419285285587 +web_nlg_en,0,PALM_prompt,rouge2_fmeasure,0.03514871886969164 +web_nlg_en,0,median,rouge2_fmeasure,0.03514871886969164 +web_nlg_en,1,PALM_prompt,rouge2_fmeasure,0.0348005109489672 +web_nlg_en,1,median,rouge2_fmeasure,0.0348005109489672 +web_nlg_en,2,PALM_prompt,rouge2_fmeasure,0.036072521136247385 +web_nlg_en,2,median,rouge2_fmeasure,0.036072521136247385 +web_nlg_en,3,PALM_prompt,rouge2_fmeasure,0.03505346120993315 +web_nlg_en,3,median,rouge2_fmeasure,0.03505346120993315 +web_nlg_en,4,PALM_prompt,rouge2_fmeasure,0.03527561542480963 +web_nlg_en,4,median,rouge2_fmeasure,0.03527561542480963 +web_nlg_en,5,PALM_prompt,rouge2_fmeasure,0.034951021231894634 +web_nlg_en,5,median,rouge2_fmeasure,0.034951021231894634 +web_nlg_en,5,average,multiple,0.03521697480359061 +wiki_lingua_en,0,tldr_en,rouge2_fmeasure,0.026484542226918303 +wiki_lingua_en,0,median,rouge2_fmeasure,0.026484542226918303 +wiki_lingua_en,1,tldr_en,rouge2_fmeasure,0.026405299879801242 +wiki_lingua_en,1,median,rouge2_fmeasure,0.026405299879801242 +wiki_lingua_en,2,tldr_en,rouge2_fmeasure,0.028604389417761292 +wiki_lingua_en,2,median,rouge2_fmeasure,0.028604389417761292 +wiki_lingua_en,3,tldr_en,rouge2_fmeasure,0.025681636061568994 +wiki_lingua_en,3,median,rouge2_fmeasure,0.025681636061568994 +wiki_lingua_en,4,tldr_en,rouge2_fmeasure,0.009405169337583598 +wiki_lingua_en,4,median,rouge2_fmeasure,0.009405169337583598 +wiki_lingua_en,5,tldr_en,rouge2_fmeasure,0.0013965027873250944 +wiki_lingua_en,5,median,rouge2_fmeasure,0.0013965027873250944 +wiki_lingua_en,5,average,multiple,0.019662923285159752 diff --git a/4b284b1b9c4seed2/evaluation/generation/merged.json b/4b284b1b9c4seed2/evaluation/generation/merged.json new file mode 100644 index 0000000000000000000000000000000000000000..884fbd90ed9eebf5ac9e912dc887f9ba0b4fb01e --- /dev/null +++ b/4b284b1b9c4seed2/evaluation/generation/merged.json @@ -0,0 +1 @@ +{"GEM/web_nlg_en": {"0": {"PALM_prompt": {"bleu": 0.2736384503031292, "bleu_stderr": 0.013761131588040647, "rouge1_fmeasure": 0.0841242506256365, "rouge1_fmeasure_stderr": 0.0018270976968369269, "rouge1_precision": 0.06743672908113135, "rouge1_precision_stderr": 0.002638252273936629, "rouge1_recall": 0.24234907953353363, "rouge1_recall_stderr": 0.004536576899675782, "rouge2_fmeasure": 0.03514871886969164, "rouge2_fmeasure_stderr": 0.0011146408262655305, "rouge2_precision": 0.027017029568202292, "rouge2_precision_stderr": 0.0014828730907298778, "rouge2_recall": 0.10299041387162453, "rouge2_recall_stderr": 0.0029846982659956075, "rougeL_fmeasure": 0.07737030634527048, "rougeL_fmeasure_stderr": 0.0016531878395951427, "rougeL_precision": 0.06194176556417661, "rougeL_precision_stderr": 0.002469243942808823, "rougeL_recall": 0.2264836217634177, "rougeL_recall_stderr": 0.00433268038244018, "rougeLsum_fmeasure": 0.07803274538661605, "rougeLsum_fmeasure_stderr": 0.0016759567284788054, "rougeLsum_precision": 0.06286672427102329, "rougeLsum_precision_stderr": 0.002521739438447608, "rougeLsum_recall": 0.22562189058095142, "rougeLsum_recall_stderr": 0.004207794303094894}}, "1": {"PALM_prompt": {"bleu": 0.3280132335844989, "bleu_stderr": 0.023397817639014704, "rouge1_fmeasure": 0.08616965529606423, "rouge1_fmeasure_stderr": 0.0017333332075431082, "rouge1_precision": 0.0644491309312055, "rouge1_precision_stderr": 0.002168252601283438, "rouge1_recall": 0.26932324402478697, "rouge1_recall_stderr": 0.004869448854108838, "rouge2_fmeasure": 0.0348005109489672, "rouge2_fmeasure_stderr": 0.001057061308651459, "rouge2_precision": 0.026688837851098213, "rouge2_precision_stderr": 0.00144137777314208, "rouge2_recall": 0.11232023057734815, "rouge2_recall_stderr": 0.0031229809372560016, "rougeL_fmeasure": 0.07766746661115345, "rougeL_fmeasure_stderr": 0.0015488126211683285, "rougeL_precision": 0.05835398948355422, "rougeL_precision_stderr": 0.002014413516440926, "rougeL_recall": 0.24510976411983082, "rougeL_recall_stderr": 0.004441288545500777, "rougeLsum_fmeasure": 0.07959776724269638, "rougeLsum_fmeasure_stderr": 0.0015771133465866834, "rougeLsum_precision": 0.05982295830374904, "rougeLsum_precision_stderr": 0.0020397591398194034, "rougeLsum_recall": 0.24879869028857263, "rougeLsum_recall_stderr": 0.004418589131657239}}, "2": {"PALM_prompt": {"bleu": 0.34638515482577353, "bleu_stderr": 0.015291163912320053, "rouge1_fmeasure": 0.0880916672062598, "rouge1_fmeasure_stderr": 0.0018284068254863554, "rouge1_precision": 0.06391106809448908, "rouge1_precision_stderr": 0.0022299798579838675, "rouge1_recall": 0.27425504532607553, "rouge1_recall_stderr": 0.004799759636672703, "rouge2_fmeasure": 0.036072521136247385, "rouge2_fmeasure_stderr": 0.0011506150158658523, "rouge2_precision": 0.026175962829444736, "rouge2_precision_stderr": 0.0013416093394333784, "rouge2_recall": 0.11550668310546741, "rouge2_recall_stderr": 0.003058036972217679, "rougeL_fmeasure": 0.07881332955128942, "rougeL_fmeasure_stderr": 0.001602085026744074, "rougeL_precision": 0.05713027372206721, "rougeL_precision_stderr": 0.001991481877156521, "rougeL_recall": 0.24716315799999466, "rougeL_recall_stderr": 0.0043125243751206115, "rougeLsum_fmeasure": 0.08169534672440366, "rougeLsum_fmeasure_stderr": 0.0016715880286721457, "rougeLsum_precision": 0.059367895890295445, "rougeLsum_precision_stderr": 0.0020685069924175725, "rougeLsum_recall": 0.25477280658969237, "rougeLsum_recall_stderr": 0.004397648802195207}}, "3": {"PALM_prompt": {"bleu": 0.3704624770003497, "bleu_stderr": 0.03638159942943428, "rouge1_fmeasure": 0.08559857536619786, "rouge1_fmeasure_stderr": 0.0016363130752602227, "rouge1_precision": 0.05982634280444436, "rouge1_precision_stderr": 0.0018001262758726789, "rouge1_recall": 0.2777138419634843, "rouge1_recall_stderr": 0.004952916631808108, "rouge2_fmeasure": 0.03505346120993315, "rouge2_fmeasure_stderr": 0.0010090465429173114, "rouge2_precision": 0.02360102097448928, "rouge2_precision_stderr": 0.000854243652157208, "rouge2_recall": 0.12042632696557598, "rouge2_recall_stderr": 0.0032866446467497232, "rougeL_fmeasure": 0.07654509455251524, "rougeL_fmeasure_stderr": 0.0014639780726145254, "rougeL_precision": 0.05383446823399059, "rougeL_precision_stderr": 0.0017041071876981678, "rougeL_recall": 0.2500627435472675, "rougeL_recall_stderr": 0.0044852293234451, "rougeLsum_fmeasure": 0.07947542844329104, "rougeLsum_fmeasure_stderr": 0.0015233699868767465, "rougeLsum_precision": 0.055977403732155415, "rougeLsum_precision_stderr": 0.0017529438408709402, "rougeLsum_recall": 0.25674832287427335, "rougeLsum_recall_stderr": 0.00451833760788113}}, "4": {"PALM_prompt": {"bleu": 0.34948975698170615, "bleu_stderr": 0.023821938767836993, "rouge1_fmeasure": 0.08584051874793835, "rouge1_fmeasure_stderr": 0.0015622002417028488, "rouge1_precision": 0.058510872569050076, "rouge1_precision_stderr": 0.0014977652612347687, "rouge1_recall": 0.27839964342296464, "rouge1_recall_stderr": 0.004925790540801674, "rouge2_fmeasure": 0.03527561542480963, "rouge2_fmeasure_stderr": 0.0009617481477463297, "rouge2_precision": 0.023403315924946395, "rouge2_precision_stderr": 0.0007924389946385025, "rouge2_recall": 0.12173985471099795, "rouge2_recall_stderr": 0.003270953240241298, "rougeL_fmeasure": 0.07682570075935022, "rougeL_fmeasure_stderr": 0.0013946187591393226, "rougeL_precision": 0.052502534519531324, "rougeL_precision_stderr": 0.0013726859531974134, "rougeL_recall": 0.24948504716127445, "rougeL_recall_stderr": 0.004413042414587561, "rougeLsum_fmeasure": 0.079801865581312, "rougeLsum_fmeasure_stderr": 0.0014350152199570983, "rougeLsum_precision": 0.05451930264143289, "rougeLsum_precision_stderr": 0.0014056245713133853, "rougeLsum_recall": 0.25804555072515556, "rougeLsum_recall_stderr": 0.004485018866773874}}, "5": {"PALM_prompt": {"bleu": 0.3520654919870807, "bleu_stderr": 0.027609734870300613, "rouge1_fmeasure": 0.0854739749972663, "rouge1_fmeasure_stderr": 0.0016018030269853596, "rouge1_precision": 0.06066641398573986, "rouge1_precision_stderr": 0.0019391074427159668, "rouge1_recall": 0.27264418002989005, "rouge1_recall_stderr": 0.004798703480922437, "rouge2_fmeasure": 0.034951021231894634, "rouge2_fmeasure_stderr": 0.0009990590843116766, "rouge2_precision": 0.02575665330833014, "rouge2_precision_stderr": 0.0013664015126702937, "rouge2_recall": 0.11728661099632723, "rouge2_recall_stderr": 0.003159030312730633, "rougeL_fmeasure": 0.0757905577263458, "rougeL_fmeasure_stderr": 0.0014241979978356996, "rougeL_precision": 0.05442877601650985, "rougeL_precision_stderr": 0.0018622354837109474, "rougeL_recall": 0.24215142547294755, "rougeL_recall_stderr": 0.0042165672086959295, "rougeLsum_fmeasure": 0.07931691685317459, "rougeLsum_fmeasure_stderr": 0.001477735740337954, "rougeLsum_precision": 0.05680657817739951, "rougeLsum_precision_stderr": 0.0018856743142604026, "rougeLsum_recall": 0.2521970662394448, "rougeLsum_recall_stderr": 0.004360316207858167}}}, "GEM/wiki_lingua_en": {"0": {"tldr_en": {"bleu": 1.1939811006947518, "bleu_stderr": 0.05144840709887267, "rouge1_fmeasure": 0.15984310029967955, "rouge1_fmeasure_stderr": 0.0017964555443949755, "rouge1_precision": 0.14402662945431702, "rouge1_precision_stderr": 0.0019964636983908577, "rouge1_recall": 0.224835520834695, "rouge1_recall_stderr": 0.002534663076636594, "rouge2_fmeasure": 0.026484542226918303, "rouge2_fmeasure_stderr": 0.0007149276960787613, "rouge2_precision": 0.024253651892450524, "rouge2_precision_stderr": 0.0007830043238366567, "rouge2_recall": 0.03807915014193239, "rouge2_recall_stderr": 0.0011514900025684483, "rougeL_fmeasure": 0.12162866229386085, "rougeL_fmeasure_stderr": 0.0012526718135058654, "rougeL_precision": 0.1089736641128092, "rougeL_precision_stderr": 0.0014490175204519933, "rougeL_recall": 0.1749701135473759, "rougeL_recall_stderr": 0.0019676023959095718, "rougeLsum_fmeasure": 0.14948770603973066, "rougeLsum_fmeasure_stderr": 0.001676038166549879, "rougeLsum_precision": 0.1346760996841278, "rougeLsum_precision_stderr": 0.0018704153662604697, "rougeLsum_recall": 0.21077414533420868, "rougeLsum_recall_stderr": 0.0023879704709676495}}, "1": {"tldr_en": {"bleu": 1.329387173898731, "bleu_stderr": 0.050959742820502744, "rouge1_fmeasure": 0.16323809480458262, "rouge1_fmeasure_stderr": 0.0017781665840047188, "rouge1_precision": 0.1421779647141786, "rouge1_precision_stderr": 0.00183899601619, "rouge1_recall": 0.2328221252469704, "rouge1_recall_stderr": 0.002523117541816358, "rouge2_fmeasure": 0.026405299879801242, "rouge2_fmeasure_stderr": 0.0007513499596621286, "rouge2_precision": 0.023068734244902384, "rouge2_precision_stderr": 0.0006924316781711188, "rouge2_recall": 0.038394150548631906, "rouge2_recall_stderr": 0.0012070561863604995, "rougeL_fmeasure": 0.12039709037310402, "rougeL_fmeasure_stderr": 0.0012183558463707484, "rougeL_precision": 0.10407135199844923, "rougeL_precision_stderr": 0.0012739274090963085, "rougeL_recall": 0.1756629066815182, "rougeL_recall_stderr": 0.001920166706499377, "rougeLsum_fmeasure": 0.15379828585730648, "rougeLsum_fmeasure_stderr": 0.0016655511240505972, "rougeLsum_precision": 0.13389561548404935, "rougeLsum_precision_stderr": 0.0017270516951590925, "rougeLsum_recall": 0.21986093946231267, "rougeLsum_recall_stderr": 0.0023909852118580966}}, "2": {"tldr_en": {"bleu": 1.4424517914266726, "bleu_stderr": 0.07020911999324617, "rouge1_fmeasure": 0.16632065161606457, "rouge1_fmeasure_stderr": 0.0018066810527815245, "rouge1_precision": 0.1457832945742694, "rouge1_precision_stderr": 0.0019709762483393995, "rouge1_recall": 0.23637305672174788, "rouge1_recall_stderr": 0.00247992475878217, "rouge2_fmeasure": 0.028604389417761292, "rouge2_fmeasure_stderr": 0.0007628849403399381, "rouge2_precision": 0.025484778469339338, "rouge2_precision_stderr": 0.0007890273465689312, "rouge2_recall": 0.04140023492730905, "rouge2_recall_stderr": 0.0012184459681475824, "rougeL_fmeasure": 0.1241823537201758, "rougeL_fmeasure_stderr": 0.0012458496339153408, "rougeL_precision": 0.10769050653186357, "rougeL_precision_stderr": 0.0013738979743412702, "rougeL_recall": 0.1810403836066358, "rougeL_recall_stderr": 0.0019346598459529787, "rougeLsum_fmeasure": 0.15640138097648992, "rougeLsum_fmeasure_stderr": 0.0016797214333223785, "rougeLsum_precision": 0.1369600906660757, "rougeLsum_precision_stderr": 0.0018450558019738083, "rougeLsum_recall": 0.22309275958929797, "rougeLsum_recall_stderr": 0.00234205408760469}}, "3": {"tldr_en": {"bleu": 1.6327965384480934, "bleu_stderr": 0.04784558757070599, "rouge1_fmeasure": 0.143979322470228, "rouge1_fmeasure_stderr": 0.0020322874462190108, "rouge1_precision": 0.12998655695663616, "rouge1_precision_stderr": 0.002189516833129907, "rouge1_recall": 0.20496486516154497, "rouge1_recall_stderr": 0.0028659172041743037, "rouge2_fmeasure": 0.025681636061568994, "rouge2_fmeasure_stderr": 0.0007575885700225844, "rouge2_precision": 0.02321033760008198, "rouge2_precision_stderr": 0.0007517668617932092, "rouge2_recall": 0.03739800165990479, "rouge2_recall_stderr": 0.0012436961876240002, "rougeL_fmeasure": 0.10744111532164179, "rougeL_fmeasure_stderr": 0.0014289232021387648, "rougeL_precision": 0.09639136628498862, "rougeL_precision_stderr": 0.0015654498649897994, "rougeL_recall": 0.15704796853631195, "rougeL_recall_stderr": 0.002245229184123941, "rougeLsum_fmeasure": 0.13580783797212667, "rougeLsum_fmeasure_stderr": 0.0019069485763797925, "rougeLsum_precision": 0.12253923603559544, "rougeLsum_precision_stderr": 0.0020589899658542553, "rougeLsum_recall": 0.19382819078757685, "rougeLsum_recall_stderr": 0.0027171877182869237}}, "4": {"tldr_en": {"bleu": 0.3975830375151671, "bleu_stderr": 0.03517002110590927, "rouge1_fmeasure": 0.04993869263777386, "rouge1_fmeasure_stderr": 0.0017400482796179053, "rouge1_precision": 0.046448930876018805, "rouge1_precision_stderr": 0.0018035348802430623, "rouge1_recall": 0.07357293605788026, "rouge1_recall_stderr": 0.0025697179083559174, "rouge2_fmeasure": 0.009405169337583598, "rouge2_fmeasure_stderr": 0.0005257744049594801, "rouge2_precision": 0.009115547013068444, "rouge2_precision_stderr": 0.0007080420784229646, "rouge2_recall": 0.014379490534632422, "rouge2_recall_stderr": 0.0008642671865072303, "rougeL_fmeasure": 0.038166867834712785, "rougeL_fmeasure_stderr": 0.0012986554235132886, "rougeL_precision": 0.03565948935943829, "rougeL_precision_stderr": 0.0013979177010115587, "rougeL_recall": 0.057422168791446994, "rougeL_recall_stderr": 0.0020177366914654244, "rougeLsum_fmeasure": 0.0469149420555244, "rougeLsum_fmeasure_stderr": 0.0016335234715811244, "rougeLsum_precision": 0.04362589861222556, "rougeLsum_precision_stderr": 0.0016994783987957273, "rougeLsum_recall": 0.06935466728288939, "rougeLsum_recall_stderr": 0.002427541920224267}}, "5": {"tldr_en": {"bleu": 6.239939007315392e-07, "bleu_stderr": 9.71466408645211e-07, "rouge1_fmeasure": 0.007568370913695297, "rouge1_fmeasure_stderr": 0.0007491159620591852, "rouge1_precision": 0.007172892267383475, "rouge1_precision_stderr": 0.0007917929568286087, "rouge1_recall": 0.011671122997395015, "rouge1_recall_stderr": 0.0011606516791878689, "rouge2_fmeasure": 0.0013965027873250944, "rouge2_fmeasure_stderr": 0.00020572985862442358, "rouge2_precision": 0.001264178384729475, "rouge2_precision_stderr": 0.0001966473650926985, "rouge2_recall": 0.0024796221258986603, "rouge2_recall_stderr": 0.0004192114120392164, "rougeL_fmeasure": 0.005865552021821947, "rougeL_fmeasure_stderr": 0.0005564517319441601, "rougeL_precision": 0.005490417768289501, "rougeL_precision_stderr": 0.0005849801172714558, "rougeL_recall": 0.009413328535258628, "rougeL_recall_stderr": 0.0009398460308935353, "rougeLsum_fmeasure": 0.007131866271390784, "rougeLsum_fmeasure_stderr": 0.0007049678056309991, "rougeLsum_precision": 0.006712756393605032, "rougeLsum_precision_stderr": 0.0007345666949798625, "rougeLsum_recall": 0.010998399946717396, "rougeLsum_recall_stderr": 0.0010932046581100556}}}, "e2e_nlg_cleaned": {"0": {"generate_text_restaurant": {"bleu": 0.9812514400249457, "bleu_stderr": 0.05562262752722095, "rouge1_fmeasure": 0.10900954926081764, "rouge1_fmeasure_stderr": 0.0020004132814706306, "rouge1_precision": 0.15847815457785414, "rouge1_precision_stderr": 0.004328803941964481, "rouge1_recall": 0.12742700108402852, "rouge1_recall_stderr": 0.0023559640853185737, "rouge2_fmeasure": 0.027201662156796255, "rouge2_fmeasure_stderr": 0.000788791139157471, "rouge2_precision": 0.07159611132449242, "rouge2_precision_stderr": 0.0037286287454660018, "rouge2_recall": 0.028548308692682663, "rouge2_recall_stderr": 0.0008068071456433969, "rougeL_fmeasure": 0.08788250933957609, "rougeL_fmeasure_stderr": 0.0015590214437749034, "rougeL_precision": 0.1334388407711523, "rougeL_precision_stderr": 0.003974193073139387, "rougeL_recall": 0.10337061722487395, "rougeL_recall_stderr": 0.0018911584688758604, "rougeLsum_fmeasure": 0.09356044304033936, "rougeLsum_fmeasure_stderr": 0.001722161996359038, "rougeLsum_precision": 0.14150177498276953, "rougeLsum_precision_stderr": 0.004129595856079377, "rougeLsum_recall": 0.10875548432324901, "rougeLsum_recall_stderr": 0.002033382683937447}}, "1": {"generate_text_restaurant": {"bleu": 5.2253192440366405, "bleu_stderr": 0.07140167205007719, "rouge1_fmeasure": 0.26325944037191484, "rouge1_fmeasure_stderr": 0.0022748072352886776, "rouge1_precision": 0.3815177071515503, "rouge1_precision_stderr": 0.005218371241177884, "rouge1_recall": 0.3106318538579719, "rouge1_recall_stderr": 0.0031963478818675803, "rouge2_fmeasure": 0.10002146341400579, "rouge2_fmeasure_stderr": 0.0014693572942374512, "rouge2_precision": 0.20178279286083556, "rouge2_precision_stderr": 0.005294112759514037, "rouge2_recall": 0.11654879964306347, "rouge2_recall_stderr": 0.001824032288290023, "rougeL_fmeasure": 0.2113652311205057, "rougeL_fmeasure_stderr": 0.0017419352055642414, "rougeL_precision": 0.324114703856428, "rougeL_precision_stderr": 0.005097258650525136, "rougeL_recall": 0.2500017558247758, "rougeL_recall_stderr": 0.0025922878822160645, "rougeLsum_fmeasure": 0.22354194196380525, "rougeLsum_fmeasure_stderr": 0.0019987653462617975, "rougeLsum_precision": 0.3390145444380815, "rougeLsum_precision_stderr": 0.005172645689386997, "rougeLsum_recall": 0.26174975224096514, "rougeLsum_recall_stderr": 0.002787496997673839}}, "2": {"generate_text_restaurant": {"bleu": 5.968462167589187, "bleu_stderr": 0.0809413455934123, "rouge1_fmeasure": 0.29114774014783334, "rouge1_fmeasure_stderr": 0.0021518045305416187, "rouge1_precision": 0.37561041209802154, "rouge1_precision_stderr": 0.004803576540487985, "rouge1_recall": 0.34542246645230873, "rouge1_recall_stderr": 0.0028469806255225247, "rouge2_fmeasure": 0.11837013500076157, "rouge2_fmeasure_stderr": 0.0014809679532815788, "rouge2_precision": 0.18697031703703257, "rouge2_precision_stderr": 0.004365267354030048, "rouge2_recall": 0.13946536473639037, "rouge2_recall_stderr": 0.0018038930024966585, "rougeL_fmeasure": 0.2378485997813391, "rougeL_fmeasure_stderr": 0.0017083954437583943, "rougeL_precision": 0.315951536990457, "rougeL_precision_stderr": 0.004519636510616847, "rougeL_recall": 0.2848990694431196, "rougeL_recall_stderr": 0.0024528350275542597, "rougeLsum_fmeasure": 0.24624266553405377, "rougeLsum_fmeasure_stderr": 0.001958228700135443, "rougeLsum_precision": 0.32795875851147216, "rougeLsum_precision_stderr": 0.004687306327421472, "rougeLsum_recall": 0.29047623226002345, "rougeLsum_recall_stderr": 0.0025636131138164543}}, "3": {"generate_text_restaurant": {"bleu": 6.100413535925033, "bleu_stderr": 0.10204084214961892, "rouge1_fmeasure": 0.29715275676346536, "rouge1_fmeasure_stderr": 0.0020593689131373845, "rouge1_precision": 0.35577144203191385, "rouge1_precision_stderr": 0.004537003722998761, "rouge1_recall": 0.3647244934358361, "rouge1_recall_stderr": 0.002747523679173933, "rouge2_fmeasure": 0.12236707177425063, "rouge2_fmeasure_stderr": 0.001437321932186944, "rouge2_precision": 0.17035987156923135, "rouge2_precision_stderr": 0.0038407536951717567, "rouge2_recall": 0.15028814529506035, "rouge2_recall_stderr": 0.0018136946483250282, "rougeL_fmeasure": 0.24251170955511187, "rougeL_fmeasure_stderr": 0.0016065436945657693, "rougeL_precision": 0.29603811661828844, "rougeL_precision_stderr": 0.004152196775629119, "rougeL_recall": 0.3006722948935132, "rougeL_recall_stderr": 0.0023586910132368166, "rougeLsum_fmeasure": 0.2502378170722232, "rougeLsum_fmeasure_stderr": 0.0018582144974208202, "rougeLsum_precision": 0.30701171887463186, "rougeLsum_precision_stderr": 0.0043364855185944965, "rougeLsum_recall": 0.30602796565632656, "rougeLsum_recall_stderr": 0.0024654434831691296}}, "4": {"generate_text_restaurant": {"bleu": 6.302528506929725, "bleu_stderr": 0.09159160557761398, "rouge1_fmeasure": 0.3106389862425593, "rouge1_fmeasure_stderr": 0.0019745864967604964, "rouge1_precision": 0.3457184925802193, "rouge1_precision_stderr": 0.004160231582604038, "rouge1_recall": 0.38873799656965313, "rouge1_recall_stderr": 0.002639030454229803, "rouge2_fmeasure": 0.12862161964342028, "rouge2_fmeasure_stderr": 0.001433312603510002, "rouge2_precision": 0.1613981344463189, "rouge2_precision_stderr": 0.0034319902981585207, "rouge2_recall": 0.16100746129847524, "rouge2_recall_stderr": 0.0017978172805353685, "rougeL_fmeasure": 0.25227586868839813, "rougeL_fmeasure_stderr": 0.001559219635105758, "rougeL_precision": 0.28411370893647675, "rougeL_precision_stderr": 0.003743798776985757, "rougeL_recall": 0.319390176337282, "rougeL_recall_stderr": 0.0023152107019332466, "rougeLsum_fmeasure": 0.26125127654019925, "rougeLsum_fmeasure_stderr": 0.0018446022776906345, "rougeLsum_precision": 0.2963124375137464, "rougeLsum_precision_stderr": 0.003972319515480073, "rougeLsum_recall": 0.32622007058557423, "rougeLsum_recall_stderr": 0.002450252978851981}}, "5": {"generate_text_restaurant": {"bleu": 6.2420502388251435, "bleu_stderr": 0.11069521906199865, "rouge1_fmeasure": 0.31044786268293756, "rouge1_fmeasure_stderr": 0.001944681263041426, "rouge1_precision": 0.31078931466957455, "rouge1_precision_stderr": 0.0035821838565772805, "rouge1_recall": 0.40928814978401035, "rouge1_recall_stderr": 0.002513611780694676, "rouge2_fmeasure": 0.12861734204623188, "rouge2_fmeasure_stderr": 0.0014302618265553057, "rouge2_precision": 0.13661422794726982, "rouge2_precision_stderr": 0.00268531843352623, "rouge2_recall": 0.17131478141957424, "rouge2_recall_stderr": 0.001846264774766135, "rougeL_fmeasure": 0.2510224592044638, "rougeL_fmeasure_stderr": 0.0015295416689170924, "rougeL_precision": 0.2514460944139299, "rougeL_precision_stderr": 0.0030526186239578533, "rougeL_recall": 0.3356791583944898, "rougeL_recall_stderr": 0.002240539567274668, "rougeLsum_fmeasure": 0.2617560668553504, "rougeLsum_fmeasure_stderr": 0.001820974367559263, "rougeLsum_precision": 0.26462055977448007, "rougeLsum_precision_stderr": 0.003336730030918389, "rougeLsum_recall": 0.3452406840839544, "rougeLsum_recall_stderr": 0.0023886668900561766}}}, "gem_xsum": {"0": {"article_DOC_summary": {"bleu": 1.4539286316534636, "bleu_stderr": 0.10413341300371938, "rouge1_fmeasure": 0.20008656508370964, "rouge1_fmeasure_stderr": 0.002602919942357546, "rouge1_precision": 0.16316619187689388, "rouge1_precision_stderr": 0.002890984890147137, "rouge1_recall": 0.31001559634568143, "rouge1_recall_stderr": 0.003978659821378838, "rouge2_fmeasure": 0.04090748442736069, "rouge2_fmeasure_stderr": 0.0014928104681925642, "rouge2_precision": 0.03352547525672803, "rouge2_precision_stderr": 0.0014320698536196147, "rouge2_recall": 0.06430340976455366, "rouge2_recall_stderr": 0.00231938341604023, "rougeL_fmeasure": 0.1502142949913443, "rougeL_fmeasure_stderr": 0.0020028080134693966, "rougeL_precision": 0.12270675062564947, "rougeL_precision_stderr": 0.0022927482127938856, "rougeL_recall": 0.2338821411106156, "rougeL_recall_stderr": 0.0031011088285461284, "rougeLsum_fmeasure": 0.15761386746032657, "rougeLsum_fmeasure_stderr": 0.0021239498717418375, "rougeLsum_precision": 0.12803202942224567, "rougeLsum_precision_stderr": 0.002326732638749928, "rougeLsum_recall": 0.24656433036848785, "rougeLsum_recall_stderr": 0.003410843786433149}}, "1": {"article_DOC_summary": {"bleu": 0.9965190176386574, "bleu_stderr": 0.05559453420420461, "rouge1_fmeasure": 0.16026754839725937, "rouge1_fmeasure_stderr": 0.002152722052964271, "rouge1_precision": 0.11453236899619632, "rouge1_precision_stderr": 0.0016195986503994135, "rouge1_recall": 0.2802645254992808, "rouge1_recall_stderr": 0.003696829148468212, "rouge2_fmeasure": 0.024638353865890434, "rouge2_fmeasure_stderr": 0.0011382421012757812, "rouge2_precision": 0.01742972704474614, "rouge2_precision_stderr": 0.0008103528180574307, "rouge2_recall": 0.04404260214452908, "rouge2_recall_stderr": 0.0020813739232181275, "rougeL_fmeasure": 0.12352821757343255, "rougeL_fmeasure_stderr": 0.0016133160942209523, "rougeL_precision": 0.08816027894258283, "rougeL_precision_stderr": 0.0012193640200953474, "rougeL_recall": 0.21709258927943814, "rougeL_recall_stderr": 0.002827223535684834, "rougeLsum_fmeasure": 0.12904870256695447, "rougeLsum_fmeasure_stderr": 0.0017598213737764256, "rougeLsum_precision": 0.0920451713692867, "rougeLsum_precision_stderr": 0.0013155981196239118, "rougeLsum_recall": 0.2271186416361983, "rougeLsum_recall_stderr": 0.003132670977496884}}, "2": {"article_DOC_summary": {"bleu": 0.8252686451228434, "bleu_stderr": 0.06219441463160752, "rouge1_fmeasure": 0.15769070631922, "rouge1_fmeasure_stderr": 0.001982981910213691, "rouge1_precision": 0.11145983804593526, "rouge1_precision_stderr": 0.0014743643800890196, "rouge1_recall": 0.28045679367482057, "rouge1_recall_stderr": 0.0034259770552426184, "rouge2_fmeasure": 0.021605793985650032, "rouge2_fmeasure_stderr": 0.0009634567881537258, "rouge2_precision": 0.015152005516530816, "rouge2_precision_stderr": 0.0006754060180232467, "rouge2_recall": 0.039166379272577614, "rouge2_recall_stderr": 0.0017988727907617531, "rougeL_fmeasure": 0.12029157280634108, "rougeL_fmeasure_stderr": 0.001476371836829727, "rougeL_precision": 0.08486603983815774, "rougeL_precision_stderr": 0.001085791049406374, "rougeL_recall": 0.21516366945216606, "rougeL_recall_stderr": 0.0026703236853124913, "rougeLsum_fmeasure": 0.12777306089054677, "rougeLsum_fmeasure_stderr": 0.0016653146013723525, "rougeLsum_precision": 0.0901270375976316, "rougeLsum_precision_stderr": 0.0012216984674086196, "rougeLsum_recall": 0.2285463112828528, "rougeLsum_recall_stderr": 0.002980474602095322}}, "3": {"article_DOC_summary": {"bleu": 0.8113683570520359, "bleu_stderr": 0.06619825265722147, "rouge1_fmeasure": 0.14870537856013735, "rouge1_fmeasure_stderr": 0.0022250373297856207, "rouge1_precision": 0.1078263305297306, "rouge1_precision_stderr": 0.0017542085299995392, "rouge1_recall": 0.2580253690370548, "rouge1_recall_stderr": 0.0037660524996162735, "rouge2_fmeasure": 0.020403012896272645, "rouge2_fmeasure_stderr": 0.0009871637156077466, "rouge2_precision": 0.014571709458807564, "rouge2_precision_stderr": 0.0007101227457714503, "rouge2_recall": 0.03574556425775684, "rouge2_recall_stderr": 0.0017388222484751564, "rougeL_fmeasure": 0.11315310318316395, "rougeL_fmeasure_stderr": 0.0016139643872092233, "rougeL_precision": 0.08197966655283043, "rougeL_precision_stderr": 0.001292307383970243, "rougeL_recall": 0.1974050382443013, "rougeL_recall_stderr": 0.0028035058486686956, "rougeLsum_fmeasure": 0.12007749682129613, "rougeLsum_fmeasure_stderr": 0.0017680042779764178, "rougeLsum_precision": 0.08677115079741256, "rougeLsum_precision_stderr": 0.001375140243984192, "rougeLsum_recall": 0.20995584785478394, "rougeLsum_recall_stderr": 0.0031091921366029267}}, "4": {"article_DOC_summary": {"bleu": 0.4568380418312376, "bleu_stderr": 0.11240957017003458, "rouge1_fmeasure": 0.04010781297274983, "rouge1_fmeasure_stderr": 0.0022481684730005936, "rouge1_precision": 0.03418472303276383, "rouge1_precision_stderr": 0.00210110351555125, "rouge1_recall": 0.06304793651249774, "rouge1_recall_stderr": 0.0035973524455498603, "rouge2_fmeasure": 0.00536187053653973, "rouge2_fmeasure_stderr": 0.0006114168649663856, "rouge2_precision": 0.004145873623694822, "rouge2_precision_stderr": 0.0005061006325311766, "rouge2_recall": 0.008843875903750643, "rouge2_recall_stderr": 0.0010081977796634128, "rougeL_fmeasure": 0.03144663530333203, "rougeL_fmeasure_stderr": 0.0017459513025573287, "rougeL_precision": 0.027278513716520444, "rougeL_precision_stderr": 0.0017455746766801424, "rougeL_recall": 0.04970336071033803, "rougeL_recall_stderr": 0.002848378744916723, "rougeLsum_fmeasure": 0.03239030933843817, "rougeLsum_fmeasure_stderr": 0.0018053015484972615, "rougeLsum_precision": 0.02813790632578131, "rougeLsum_precision_stderr": 0.0018032712966730017, "rougeLsum_recall": 0.05107839677205752, "rougeLsum_recall_stderr": 0.0029256027588574272}}, "5": {"article_DOC_summary": {"bleu": 1.2435863834999107e-38, "bleu_stderr": 1.6010999120135594e-32, "rouge1_fmeasure": 0.0017758047725847756, "rouge1_fmeasure_stderr": 0.0004794001433637215, "rouge1_precision": 0.0019374196381469005, "rouge1_precision_stderr": 0.0005297555109388115, "rouge1_recall": 0.0017199042758875617, "rouge1_recall_stderr": 0.0004699087955021987, "rouge2_fmeasure": 0.0, "rouge2_fmeasure_stderr": 0.0, "rouge2_precision": 0.0, "rouge2_precision_stderr": 0.0, "rouge2_recall": 0.0, "rouge2_recall_stderr": 0.0, "rougeL_fmeasure": 0.0014811178551071952, "rougeL_fmeasure_stderr": 0.00039295568397820974, "rougeL_precision": 0.0016417177155976152, "rougeL_precision_stderr": 0.0004455222998055521, "rougeL_recall": 0.0014066712761193988, "rougeL_recall_stderr": 0.0003697747285853825, "rougeLsum_fmeasure": 0.0016076723854203951, "rougeLsum_fmeasure_stderr": 0.0004229539683443897, "rougeLsum_precision": 0.0017493422405362358, "rougeLsum_precision_stderr": 0.0004643643474163307, "rougeLsum_recall": 0.0015674774510765171, "rougeLsum_recall_stderr": 0.00042362427764150467}}}} \ No newline at end of file diff --git a/4b284b1b9c4seed2/evaluation/generation/slim.4b284b1b9c4seed2_GEM-web_nlg_en_PALM_prompt_0.json b/4b284b1b9c4seed2/evaluation/generation/slim.4b284b1b9c4seed2_GEM-web_nlg_en_PALM_prompt_0.json new file mode 100644 index 0000000000000000000000000000000000000000..4116912a9afce6e13fafd4a0eeea32cb2d120154 --- /dev/null +++ b/4b284b1b9c4seed2/evaluation/generation/slim.4b284b1b9c4seed2_GEM-web_nlg_en_PALM_prompt_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.2736384503031292, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.013761131588040647 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.06743672908113135, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.002638252273936629 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.24234907953353363, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.004536576899675782 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.0841242506256365, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0018270976968369269 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.027017029568202292, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0014828730907298778 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.10299041387162453, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0029846982659956075 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.03514871886969164, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0011146408262655305 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.06194176556417661, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.002469243942808823 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.2264836217634177, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.00433268038244018 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.07737030634527048, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0016531878395951427 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.06286672427102329, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.002521739438447608 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.22562189058095142, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004207794303094894 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.07803274538661605, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0016759567284788054 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b1b9c4seed2/evaluation/generation/slim.4b284b1b9c4seed2_GEM-web_nlg_en_PALM_prompt_1.json b/4b284b1b9c4seed2/evaluation/generation/slim.4b284b1b9c4seed2_GEM-web_nlg_en_PALM_prompt_1.json new file mode 100644 index 0000000000000000000000000000000000000000..e790fb36e18a58a521e7c5a65cde5d8766c80478 --- /dev/null +++ b/4b284b1b9c4seed2/evaluation/generation/slim.4b284b1b9c4seed2_GEM-web_nlg_en_PALM_prompt_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.3280132335844989, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.023397817639014704 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.0644491309312055, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.002168252601283438 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.26932324402478697, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.004869448854108838 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.08616965529606423, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0017333332075431082 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.026688837851098213, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.00144137777314208 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.11232023057734815, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0031229809372560016 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.0348005109489672, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.001057061308651459 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.05835398948355422, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.002014413516440926 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.24510976411983082, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004441288545500777 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.07766746661115345, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0015488126211683285 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.05982295830374904, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0020397591398194034 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.24879869028857263, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004418589131657239 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.07959776724269638, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0015771133465866834 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b1b9c4seed2/evaluation/generation/slim.4b284b1b9c4seed2_GEM-web_nlg_en_PALM_prompt_2.json b/4b284b1b9c4seed2/evaluation/generation/slim.4b284b1b9c4seed2_GEM-web_nlg_en_PALM_prompt_2.json new file mode 100644 index 0000000000000000000000000000000000000000..f61d8fb1cf36d348e49789afc09e8e7b4057cecc --- /dev/null +++ b/4b284b1b9c4seed2/evaluation/generation/slim.4b284b1b9c4seed2_GEM-web_nlg_en_PALM_prompt_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.34638515482577353, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.015291163912320053 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.06391106809448908, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0022299798579838675 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.27425504532607553, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.004799759636672703 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.0880916672062598, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0018284068254863554 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.026175962829444736, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0013416093394333784 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.11550668310546741, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.003058036972217679 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.036072521136247385, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0011506150158658523 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.05713027372206721, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.001991481877156521 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.24716315799999466, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0043125243751206115 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.07881332955128942, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.001602085026744074 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.059367895890295445, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0020685069924175725 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.25477280658969237, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004397648802195207 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.08169534672440366, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0016715880286721457 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b1b9c4seed2/evaluation/generation/slim.4b284b1b9c4seed2_GEM-web_nlg_en_PALM_prompt_3.json b/4b284b1b9c4seed2/evaluation/generation/slim.4b284b1b9c4seed2_GEM-web_nlg_en_PALM_prompt_3.json new file mode 100644 index 0000000000000000000000000000000000000000..c540ce7bd374a106b801535ec988e08f8620175d --- /dev/null +++ b/4b284b1b9c4seed2/evaluation/generation/slim.4b284b1b9c4seed2_GEM-web_nlg_en_PALM_prompt_3.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.3704624770003497, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.03638159942943428 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.05982634280444436, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0018001262758726789 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.2777138419634843, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.004952916631808108 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.08559857536619786, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0016363130752602227 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.02360102097448928, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.000854243652157208 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.12042632696557598, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0032866446467497232 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.03505346120993315, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0010090465429173114 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.05383446823399059, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0017041071876981678 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.2500627435472675, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0044852293234451 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.07654509455251524, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0014639780726145254 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.055977403732155415, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0017529438408709402 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.25674832287427335, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.00451833760788113 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.07947542844329104, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0015233699868767465 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 3, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b1b9c4seed2/evaluation/generation/slim.4b284b1b9c4seed2_GEM-web_nlg_en_PALM_prompt_4.json b/4b284b1b9c4seed2/evaluation/generation/slim.4b284b1b9c4seed2_GEM-web_nlg_en_PALM_prompt_4.json new file mode 100644 index 0000000000000000000000000000000000000000..d97b48904ed92f4af7f5343f84f7a0b4bb827773 --- /dev/null +++ b/4b284b1b9c4seed2/evaluation/generation/slim.4b284b1b9c4seed2_GEM-web_nlg_en_PALM_prompt_4.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.34948975698170615, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.023821938767836993 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.058510872569050076, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0014977652612347687 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.27839964342296464, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.004925790540801674 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.08584051874793835, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0015622002417028488 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.023403315924946395, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0007924389946385025 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.12173985471099795, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.003270953240241298 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.03527561542480963, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0009617481477463297 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.052502534519531324, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0013726859531974134 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.24948504716127445, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004413042414587561 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.07682570075935022, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0013946187591393226 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.05451930264143289, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0014056245713133853 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.25804555072515556, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004485018866773874 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.079801865581312, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0014350152199570983 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 4, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b1b9c4seed2/evaluation/generation/slim.4b284b1b9c4seed2_GEM-web_nlg_en_PALM_prompt_5.json b/4b284b1b9c4seed2/evaluation/generation/slim.4b284b1b9c4seed2_GEM-web_nlg_en_PALM_prompt_5.json new file mode 100644 index 0000000000000000000000000000000000000000..64e1feebee5b3bb72e04022cd2ae93beac5f8527 --- /dev/null +++ b/4b284b1b9c4seed2/evaluation/generation/slim.4b284b1b9c4seed2_GEM-web_nlg_en_PALM_prompt_5.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.3520654919870807, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.027609734870300613 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.06066641398573986, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0019391074427159668 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.27264418002989005, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.004798703480922437 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.0854739749972663, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0016018030269853596 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.02575665330833014, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0013664015126702937 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.11728661099632723, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.003159030312730633 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.034951021231894634, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0009990590843116766 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.05442877601650985, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0018622354837109474 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.24215142547294755, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0042165672086959295 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.0757905577263458, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0014241979978356996 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.05680657817739951, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0018856743142604026 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.2521970662394448, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004360316207858167 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.07931691685317459, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.001477735740337954 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 5, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b1b9c4seed2/evaluation/generation/slim.4b284b1b9c4seed2_GEM-wiki_lingua_en_tldr_en_0.json b/4b284b1b9c4seed2/evaluation/generation/slim.4b284b1b9c4seed2_GEM-wiki_lingua_en_tldr_en_0.json new file mode 100644 index 0000000000000000000000000000000000000000..57a0c6ace81e0871ff311af08fbc246739767ee1 --- /dev/null +++ b/4b284b1b9c4seed2/evaluation/generation/slim.4b284b1b9c4seed2_GEM-wiki_lingua_en_tldr_en_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.14402662945431702, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0019964636983908577 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.224835520834695, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.002534663076636594 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.15984310029967955, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0017964555443949755 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.024253651892450524, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0007830043238366567 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.03807915014193239, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0011514900025684483 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.026484542226918303, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0007149276960787613 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.1089736641128092, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0014490175204519933 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.1749701135473759, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0019676023959095718 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.12162866229386085, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0012526718135058654 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.1346760996841278, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0018704153662604697 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.21077414533420868, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0023879704709676495 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.14948770603973066, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.001676038166549879 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 1.1939811006947518, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.05144840709887267 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b1b9c4seed2/evaluation/generation/slim.4b284b1b9c4seed2_GEM-wiki_lingua_en_tldr_en_1.json b/4b284b1b9c4seed2/evaluation/generation/slim.4b284b1b9c4seed2_GEM-wiki_lingua_en_tldr_en_1.json new file mode 100644 index 0000000000000000000000000000000000000000..15242f02bc94535ba2d020fbed63668f0ae7fcd6 --- /dev/null +++ b/4b284b1b9c4seed2/evaluation/generation/slim.4b284b1b9c4seed2_GEM-wiki_lingua_en_tldr_en_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.1421779647141786, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.00183899601619 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.2328221252469704, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.002523117541816358 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.16323809480458262, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0017781665840047188 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.023068734244902384, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0006924316781711188 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.038394150548631906, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0012070561863604995 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.026405299879801242, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0007513499596621286 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.10407135199844923, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0012739274090963085 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.1756629066815182, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.001920166706499377 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.12039709037310402, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0012183558463707484 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.13389561548404935, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0017270516951590925 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.21986093946231267, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0023909852118580966 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.15379828585730648, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0016655511240505972 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 1.329387173898731, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.050959742820502744 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b1b9c4seed2/evaluation/generation/slim.4b284b1b9c4seed2_GEM-wiki_lingua_en_tldr_en_2.json b/4b284b1b9c4seed2/evaluation/generation/slim.4b284b1b9c4seed2_GEM-wiki_lingua_en_tldr_en_2.json new file mode 100644 index 0000000000000000000000000000000000000000..e3d7bdac349fec345286d6e71c79a742a153f3c1 --- /dev/null +++ b/4b284b1b9c4seed2/evaluation/generation/slim.4b284b1b9c4seed2_GEM-wiki_lingua_en_tldr_en_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.1457832945742694, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0019709762483393995 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.23637305672174788, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.00247992475878217 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.16632065161606457, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0018066810527815245 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.025484778469339338, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0007890273465689312 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.04140023492730905, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0012184459681475824 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.028604389417761292, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0007628849403399381 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.10769050653186357, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0013738979743412702 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.1810403836066358, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0019346598459529787 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.1241823537201758, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0012458496339153408 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.1369600906660757, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0018450558019738083 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.22309275958929797, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.00234205408760469 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.15640138097648992, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0016797214333223785 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 1.4424517914266726, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.07020911999324617 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b1b9c4seed2/evaluation/generation/slim.4b284b1b9c4seed2_GEM-wiki_lingua_en_tldr_en_3.json b/4b284b1b9c4seed2/evaluation/generation/slim.4b284b1b9c4seed2_GEM-wiki_lingua_en_tldr_en_3.json new file mode 100644 index 0000000000000000000000000000000000000000..d8cf49b1470796da728ceaeff0d555d3b265a106 --- /dev/null +++ b/4b284b1b9c4seed2/evaluation/generation/slim.4b284b1b9c4seed2_GEM-wiki_lingua_en_tldr_en_3.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.12998655695663616, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.002189516833129907 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.20496486516154497, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0028659172041743037 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.143979322470228, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0020322874462190108 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.02321033760008198, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0007517668617932092 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.03739800165990479, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0012436961876240002 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.025681636061568994, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0007575885700225844 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.09639136628498862, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0015654498649897994 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.15704796853631195, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.002245229184123941 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.10744111532164179, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0014289232021387648 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.12253923603559544, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0020589899658542553 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.19382819078757685, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0027171877182869237 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.13580783797212667, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0019069485763797925 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 1.6327965384480934, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.04784558757070599 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 3, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b1b9c4seed2/evaluation/generation/slim.4b284b1b9c4seed2_GEM-wiki_lingua_en_tldr_en_4.json b/4b284b1b9c4seed2/evaluation/generation/slim.4b284b1b9c4seed2_GEM-wiki_lingua_en_tldr_en_4.json new file mode 100644 index 0000000000000000000000000000000000000000..0ab778ffb539c3847b4d50892389c31042a5a8f3 --- /dev/null +++ b/4b284b1b9c4seed2/evaluation/generation/slim.4b284b1b9c4seed2_GEM-wiki_lingua_en_tldr_en_4.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.046448930876018805, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0018035348802430623 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.07357293605788026, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0025697179083559174 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.04993869263777386, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0017400482796179053 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.009115547013068444, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0007080420784229646 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.014379490534632422, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0008642671865072303 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.009405169337583598, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0005257744049594801 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.03565948935943829, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0013979177010115587 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.057422168791446994, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0020177366914654244 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.038166867834712785, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0012986554235132886 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.04362589861222556, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0016994783987957273 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.06935466728288939, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.002427541920224267 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.0469149420555244, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0016335234715811244 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 0.3975830375151671, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.03517002110590927 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 4, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b1b9c4seed2/evaluation/generation/slim.4b284b1b9c4seed2_GEM-wiki_lingua_en_tldr_en_5.json b/4b284b1b9c4seed2/evaluation/generation/slim.4b284b1b9c4seed2_GEM-wiki_lingua_en_tldr_en_5.json new file mode 100644 index 0000000000000000000000000000000000000000..4f8da8f596ee464584b97ad2ecc9404c9de05e7c --- /dev/null +++ b/4b284b1b9c4seed2/evaluation/generation/slim.4b284b1b9c4seed2_GEM-wiki_lingua_en_tldr_en_5.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.007172892267383475, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0007917929568286087 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.011671122997395015, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0011606516791878689 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.007568370913695297, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0007491159620591852 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.001264178384729475, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0001966473650926985 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.0024796221258986603, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0004192114120392164 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.0013965027873250944, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.00020572985862442358 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.005490417768289501, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0005849801172714558 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.009413328535258628, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0009398460308935353 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.005865552021821947, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0005564517319441601 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.006712756393605032, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0007345666949798625 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.010998399946717396, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0010932046581100556 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.007131866271390784, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0007049678056309991 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 6.239939007315392e-07, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 9.71466408645211e-07 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 5, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b1b9c4seed2/evaluation/generation/slim.4b284b1b9c4seed2_e2e_nlg_cleaned_generate_text_restaurant_0.json b/4b284b1b9c4seed2/evaluation/generation/slim.4b284b1b9c4seed2_e2e_nlg_cleaned_generate_text_restaurant_0.json new file mode 100644 index 0000000000000000000000000000000000000000..5552ff1de54082d910a764946bbd68b68797118a --- /dev/null +++ b/4b284b1b9c4seed2/evaluation/generation/slim.4b284b1b9c4seed2_e2e_nlg_cleaned_generate_text_restaurant_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 0.9812514400249457, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.05562262752722095 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.15847815457785414, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.004328803941964481 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.12742700108402852, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.0023559640853185737 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.10900954926081764, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.0020004132814706306 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.07159611132449242, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0037286287454660018 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.028548308692682663, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.0008068071456433969 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.027201662156796255, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.000788791139157471 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.1334388407711523, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.003974193073139387 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.10337061722487395, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.0018911584688758604 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.08788250933957609, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0015590214437749034 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.14150177498276953, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.004129595856079377 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.10875548432324901, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.002033382683937447 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.09356044304033936, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.001722161996359038 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b1b9c4seed2/evaluation/generation/slim.4b284b1b9c4seed2_e2e_nlg_cleaned_generate_text_restaurant_1.json b/4b284b1b9c4seed2/evaluation/generation/slim.4b284b1b9c4seed2_e2e_nlg_cleaned_generate_text_restaurant_1.json new file mode 100644 index 0000000000000000000000000000000000000000..256a9f3847ba1197a702c179f0aded80e01c5857 --- /dev/null +++ b/4b284b1b9c4seed2/evaluation/generation/slim.4b284b1b9c4seed2_e2e_nlg_cleaned_generate_text_restaurant_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 5.2253192440366405, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.07140167205007719 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.3815177071515503, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.005218371241177884 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.3106318538579719, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.0031963478818675803 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.26325944037191484, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.0022748072352886776 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.20178279286083556, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.005294112759514037 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.11654879964306347, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.001824032288290023 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.10002146341400579, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0014693572942374512 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.324114703856428, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.005097258650525136 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.2500017558247758, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.0025922878822160645 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.2113652311205057, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0017419352055642414 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.3390145444380815, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.005172645689386997 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.26174975224096514, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.002787496997673839 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.22354194196380525, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0019987653462617975 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b1b9c4seed2/evaluation/generation/slim.4b284b1b9c4seed2_e2e_nlg_cleaned_generate_text_restaurant_2.json b/4b284b1b9c4seed2/evaluation/generation/slim.4b284b1b9c4seed2_e2e_nlg_cleaned_generate_text_restaurant_2.json new file mode 100644 index 0000000000000000000000000000000000000000..c9a66d6fb1a6c6c48cd344ba5a17f849491f10ce --- /dev/null +++ b/4b284b1b9c4seed2/evaluation/generation/slim.4b284b1b9c4seed2_e2e_nlg_cleaned_generate_text_restaurant_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 5.968462167589187, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.0809413455934123 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.37561041209802154, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.004803576540487985 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.34542246645230873, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.0028469806255225247 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.29114774014783334, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.0021518045305416187 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.18697031703703257, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.004365267354030048 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.13946536473639037, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.0018038930024966585 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.11837013500076157, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0014809679532815788 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.315951536990457, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.004519636510616847 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.2848990694431196, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.0024528350275542597 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.2378485997813391, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0017083954437583943 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.32795875851147216, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.004687306327421472 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.29047623226002345, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.0025636131138164543 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.24624266553405377, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.001958228700135443 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b1b9c4seed2/evaluation/generation/slim.4b284b1b9c4seed2_e2e_nlg_cleaned_generate_text_restaurant_3.json b/4b284b1b9c4seed2/evaluation/generation/slim.4b284b1b9c4seed2_e2e_nlg_cleaned_generate_text_restaurant_3.json new file mode 100644 index 0000000000000000000000000000000000000000..1c28972af0dc2faf91095d00c3b41d88dd99a134 --- /dev/null +++ b/4b284b1b9c4seed2/evaluation/generation/slim.4b284b1b9c4seed2_e2e_nlg_cleaned_generate_text_restaurant_3.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 6.100413535925033, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.10204084214961892 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.35577144203191385, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.004537003722998761 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.3647244934358361, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.002747523679173933 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.29715275676346536, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.0020593689131373845 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.17035987156923135, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0038407536951717567 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.15028814529506035, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.0018136946483250282 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.12236707177425063, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.001437321932186944 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.29603811661828844, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.004152196775629119 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.3006722948935132, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.0023586910132368166 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.24251170955511187, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0016065436945657693 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.30701171887463186, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.0043364855185944965 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.30602796565632656, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.0024654434831691296 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.2502378170722232, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0018582144974208202 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 3, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b1b9c4seed2/evaluation/generation/slim.4b284b1b9c4seed2_e2e_nlg_cleaned_generate_text_restaurant_4.json b/4b284b1b9c4seed2/evaluation/generation/slim.4b284b1b9c4seed2_e2e_nlg_cleaned_generate_text_restaurant_4.json new file mode 100644 index 0000000000000000000000000000000000000000..f978ed1c2dd3bac92990c2cc04284af5bc2c862c --- /dev/null +++ b/4b284b1b9c4seed2/evaluation/generation/slim.4b284b1b9c4seed2_e2e_nlg_cleaned_generate_text_restaurant_4.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 6.302528506929725, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.09159160557761398 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.3457184925802193, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.004160231582604038 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.38873799656965313, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.002639030454229803 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.3106389862425593, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.0019745864967604964 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.1613981344463189, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0034319902981585207 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.16100746129847524, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.0017978172805353685 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.12862161964342028, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.001433312603510002 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.28411370893647675, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.003743798776985757 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.319390176337282, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.0023152107019332466 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.25227586868839813, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.001559219635105758 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.2963124375137464, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.003972319515480073 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.32622007058557423, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.002450252978851981 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.26125127654019925, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0018446022776906345 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 4, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b1b9c4seed2/evaluation/generation/slim.4b284b1b9c4seed2_e2e_nlg_cleaned_generate_text_restaurant_5.json b/4b284b1b9c4seed2/evaluation/generation/slim.4b284b1b9c4seed2_e2e_nlg_cleaned_generate_text_restaurant_5.json new file mode 100644 index 0000000000000000000000000000000000000000..021a5b6fe66d6ad2be48b18e6bcda2729e74cf4d --- /dev/null +++ b/4b284b1b9c4seed2/evaluation/generation/slim.4b284b1b9c4seed2_e2e_nlg_cleaned_generate_text_restaurant_5.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 6.2420502388251435, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.11069521906199865 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.31078931466957455, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.0035821838565772805 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.40928814978401035, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.002513611780694676 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.31044786268293756, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.001944681263041426 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.13661422794726982, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.00268531843352623 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.17131478141957424, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.001846264774766135 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.12861734204623188, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0014302618265553057 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.2514460944139299, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.0030526186239578533 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.3356791583944898, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.002240539567274668 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.2510224592044638, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0015295416689170924 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.26462055977448007, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.003336730030918389 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.3452406840839544, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.0023886668900561766 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.2617560668553504, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.001820974367559263 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 5, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b1b9c4seed2/evaluation/generation/slim.4b284b1b9c4seed2_gem_xsum_article_DOC_summary_0.json b/4b284b1b9c4seed2/evaluation/generation/slim.4b284b1b9c4seed2_gem_xsum_article_DOC_summary_0.json new file mode 100644 index 0000000000000000000000000000000000000000..a81f51fd35836dea362bd0182dfadb38a303d149 --- /dev/null +++ b/4b284b1b9c4seed2/evaluation/generation/slim.4b284b1b9c4seed2_gem_xsum_article_DOC_summary_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.16316619187689388, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.002890984890147137 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.31001559634568143, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.003978659821378838 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.20008656508370964, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.002602919942357546 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.03352547525672803, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0014320698536196147 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.06430340976455366, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.00231938341604023 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.04090748442736069, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0014928104681925642 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.12270675062564947, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0022927482127938856 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.2338821411106156, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.0031011088285461284 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.1502142949913443, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0020028080134693966 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.12803202942224567, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.002326732638749928 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.24656433036848785, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.003410843786433149 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.15761386746032657, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0021239498717418375 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 1.4539286316534636, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.10413341300371938 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b1b9c4seed2/evaluation/generation/slim.4b284b1b9c4seed2_gem_xsum_article_DOC_summary_1.json b/4b284b1b9c4seed2/evaluation/generation/slim.4b284b1b9c4seed2_gem_xsum_article_DOC_summary_1.json new file mode 100644 index 0000000000000000000000000000000000000000..ee01969f2750e708cfcf4aa8d28f8bf0f79e4afb --- /dev/null +++ b/4b284b1b9c4seed2/evaluation/generation/slim.4b284b1b9c4seed2_gem_xsum_article_DOC_summary_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.11453236899619632, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.0016195986503994135 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.2802645254992808, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.003696829148468212 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.16026754839725937, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.002152722052964271 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.01742972704474614, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0008103528180574307 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.04404260214452908, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.0020813739232181275 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.024638353865890434, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0011382421012757812 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.08816027894258283, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0012193640200953474 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.21709258927943814, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.002827223535684834 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.12352821757343255, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0016133160942209523 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.0920451713692867, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0013155981196239118 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.2271186416361983, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.003132670977496884 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.12904870256695447, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0017598213737764256 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 0.9965190176386574, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.05559453420420461 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b1b9c4seed2/evaluation/generation/slim.4b284b1b9c4seed2_gem_xsum_article_DOC_summary_2.json b/4b284b1b9c4seed2/evaluation/generation/slim.4b284b1b9c4seed2_gem_xsum_article_DOC_summary_2.json new file mode 100644 index 0000000000000000000000000000000000000000..5faea469488228f2fa0871a43dd67d9944accfac --- /dev/null +++ b/4b284b1b9c4seed2/evaluation/generation/slim.4b284b1b9c4seed2_gem_xsum_article_DOC_summary_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.11145983804593526, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.0014743643800890196 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.28045679367482057, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.0034259770552426184 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.15769070631922, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.001982981910213691 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.015152005516530816, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0006754060180232467 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.039166379272577614, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.0017988727907617531 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.021605793985650032, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0009634567881537258 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.08486603983815774, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.001085791049406374 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.21516366945216606, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.0026703236853124913 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.12029157280634108, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.001476371836829727 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.0901270375976316, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0012216984674086196 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.2285463112828528, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.002980474602095322 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.12777306089054677, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0016653146013723525 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 0.8252686451228434, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.06219441463160752 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b1b9c4seed2/evaluation/generation/slim.4b284b1b9c4seed2_gem_xsum_article_DOC_summary_3.json b/4b284b1b9c4seed2/evaluation/generation/slim.4b284b1b9c4seed2_gem_xsum_article_DOC_summary_3.json new file mode 100644 index 0000000000000000000000000000000000000000..21e241351aae6bb8ce32ac84b658c6b305ea326d --- /dev/null +++ b/4b284b1b9c4seed2/evaluation/generation/slim.4b284b1b9c4seed2_gem_xsum_article_DOC_summary_3.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.1078263305297306, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.0017542085299995392 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.2580253690370548, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.0037660524996162735 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.14870537856013735, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.0022250373297856207 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.014571709458807564, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0007101227457714503 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.03574556425775684, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.0017388222484751564 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.020403012896272645, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0009871637156077466 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.08197966655283043, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.001292307383970243 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.1974050382443013, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.0028035058486686956 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.11315310318316395, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0016139643872092233 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.08677115079741256, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.001375140243984192 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.20995584785478394, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.0031091921366029267 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.12007749682129613, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0017680042779764178 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 0.8113683570520359, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.06619825265722147 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 3, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b1b9c4seed2/evaluation/generation/slim.4b284b1b9c4seed2_gem_xsum_article_DOC_summary_4.json b/4b284b1b9c4seed2/evaluation/generation/slim.4b284b1b9c4seed2_gem_xsum_article_DOC_summary_4.json new file mode 100644 index 0000000000000000000000000000000000000000..5adf4ab6bbf68330b65c444b66330ec4ca3bda0a --- /dev/null +++ b/4b284b1b9c4seed2/evaluation/generation/slim.4b284b1b9c4seed2_gem_xsum_article_DOC_summary_4.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.03418472303276383, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.00210110351555125 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.06304793651249774, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.0035973524455498603 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.04010781297274983, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.0022481684730005936 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.004145873623694822, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0005061006325311766 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.008843875903750643, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.0010081977796634128 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.00536187053653973, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0006114168649663856 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.027278513716520444, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0017455746766801424 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.04970336071033803, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.002848378744916723 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.03144663530333203, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0017459513025573287 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.02813790632578131, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0018032712966730017 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.05107839677205752, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.0029256027588574272 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.03239030933843817, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0018053015484972615 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 0.4568380418312376, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.11240957017003458 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 4, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b1b9c4seed2/evaluation/generation/slim.4b284b1b9c4seed2_gem_xsum_article_DOC_summary_5.json b/4b284b1b9c4seed2/evaluation/generation/slim.4b284b1b9c4seed2_gem_xsum_article_DOC_summary_5.json new file mode 100644 index 0000000000000000000000000000000000000000..76ea03da6476841ff1361a02805d2b4380bc5e66 --- /dev/null +++ b/4b284b1b9c4seed2/evaluation/generation/slim.4b284b1b9c4seed2_gem_xsum_article_DOC_summary_5.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.0019374196381469005, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.0005297555109388115 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.0017199042758875617, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.0004699087955021987 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.0017758047725847756, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.0004794001433637215 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.0, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.0, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.0 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.0, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.0016417177155976152, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0004455222998055521 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.0014066712761193988, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.0003697747285853825 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.0014811178551071952, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.00039295568397820974 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.0017493422405362358, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0004643643474163307 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.0015674774510765171, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.00042362427764150467 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.0016076723854203951, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0004229539683443897 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 1.2435863834999107e-38, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 1.6010999120135594e-32 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 5, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b1b9c4seed2/evaluation/rankeval/4b284b1b9c4seed2_0.csv b/4b284b1b9c4seed2/evaluation/rankeval/4b284b1b9c4seed2_0.csv new file mode 100644 index 0000000000000000000000000000000000000000..aec18774db17d8ace5475636681643c2373a617f --- /dev/null +++ b/4b284b1b9c4seed2/evaluation/rankeval/4b284b1b9c4seed2_0.csv @@ -0,0 +1,21 @@ +task,metric,value,err,version +anli_r1,acc,0.337,0.014955087918653598,0 +anli_r2,acc,0.34,0.014987482264363935,0 +anli_r3,acc,0.36,0.013862183574189902,0 +arc_challenge,acc,0.2363481228668942,0.012414960524301846,0 +arc_challenge,acc_norm,0.26791808873720135,0.01294203019513644,0 +arc_easy,acc,0.49747474747474746,0.010259652668783469,0 +arc_easy,acc_norm,0.45202020202020204,0.010212436978834111,0 +boolq,acc,0.4801223241590214,0.00873814151648864,1 +cb,acc,0.5357142857142857,0.06724777654937658,1 +cb,f1,0.35972850678733037,,1 +copa,acc,0.67,0.047258156262526066,0 +hellaswag,acc,0.3857797251543517,0.004857840934549165,0 +hellaswag,acc_norm,0.4766978689504083,0.004984359669951926,0 +piqa,acc,0.705114254624592,0.010639030620157003,0 +piqa,acc_norm,0.6985854189336235,0.01070624824275376,0 +rte,acc,0.5234657039711191,0.03006330041190266,0 +sciq,acc,0.717,0.014251810906481754,0 +sciq,acc_norm,0.646,0.015129868238451773,0 +storycloze_2016,acc,0.6568679850347408,0.010978648097499879,0 +winogrande,acc,0.5193370165745856,0.01404197273371297,0 diff --git a/4b284b1b9c4seed2/evaluation/rankeval/4b284b1b9c4seed2_0.json b/4b284b1b9c4seed2/evaluation/rankeval/4b284b1b9c4seed2_0.json new file mode 100644 index 0000000000000000000000000000000000000000..690901e5713243ef7b475cf0127b0c9a9244cd12 --- /dev/null +++ b/4b284b1b9c4seed2/evaluation/rankeval/4b284b1b9c4seed2_0.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.337, + "acc_stderr": 0.014955087918653598 + }, + "anli_r2": { + "acc": 0.34, + "acc_stderr": 0.014987482264363935 + }, + "anli_r3": { + "acc": 0.36, + "acc_stderr": 0.013862183574189902 + }, + "cb": { + "acc": 0.5357142857142857, + "acc_stderr": 0.06724777654937658, + "f1": 0.35972850678733037 + }, + "copa": { + "acc": 0.67, + "acc_stderr": 0.047258156262526066 + }, + "hellaswag": { + "acc": 0.3857797251543517, + "acc_stderr": 0.004857840934549165, + "acc_norm": 0.4766978689504083, + "acc_norm_stderr": 0.004984359669951926 + }, + "rte": { + "acc": 0.5234657039711191, + "acc_stderr": 0.03006330041190266 + }, + "winogrande": { + "acc": 0.5193370165745856, + "acc_stderr": 0.01404197273371297 + }, + "storycloze_2016": { + "acc": 0.6568679850347408, + "acc_stderr": 0.010978648097499879 + }, + "boolq": { + "acc": 0.4801223241590214, + "acc_stderr": 0.00873814151648864 + }, + "arc_easy": { + "acc": 0.49747474747474746, + "acc_stderr": 0.010259652668783469, + "acc_norm": 0.45202020202020204, + "acc_norm_stderr": 0.010212436978834111 + }, + "arc_challenge": { + "acc": 0.2363481228668942, + "acc_stderr": 0.012414960524301846, + "acc_norm": 0.26791808873720135, + "acc_norm_stderr": 0.01294203019513644 + }, + "sciq": { + "acc": 0.717, + "acc_stderr": 0.014251810906481754, + "acc_norm": 0.646, + "acc_norm_stderr": 0.015129868238451773 + }, + "piqa": { + "acc": 0.705114254624592, + "acc_stderr": 0.010639030620157003, + "acc_norm": 0.6985854189336235, + "acc_norm_stderr": 0.01070624824275376 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b1b9c4seed2/evaluation/rankeval/4b284b1b9c4seed2_1.csv b/4b284b1b9c4seed2/evaluation/rankeval/4b284b1b9c4seed2_1.csv new file mode 100644 index 0000000000000000000000000000000000000000..ae15fa98eafa0b71befa88f8734129fe2b7ffc5c --- /dev/null +++ b/4b284b1b9c4seed2/evaluation/rankeval/4b284b1b9c4seed2_1.csv @@ -0,0 +1,21 @@ +task,metric,value,err,version +anli_r1,acc,0.323,0.014794927843348633,0 +anli_r2,acc,0.364,0.015222868840522024,0 +anli_r3,acc,0.3375,0.013655897185463655,0 +arc_challenge,acc,0.23976109215017063,0.012476304127453947,0 +arc_challenge,acc_norm,0.257679180887372,0.0127807705627684,0 +arc_easy,acc,0.5071548821548821,0.01025873302244637,0 +arc_easy,acc_norm,0.4650673400673401,0.010234713052723658,0 +boolq,acc,0.5,0.008745054976398168,1 +cb,acc,0.5178571428571429,0.06737697508644648,1 +cb,f1,0.3525733525733525,,1 +copa,acc,0.65,0.047937248544110196,0 +hellaswag,acc,0.3941445927106154,0.004876674814874709,0 +hellaswag,acc_norm,0.48645688109938257,0.004987950663406552,0 +piqa,acc,0.7023939064200218,0.010667353792388213,0 +piqa,acc_norm,0.7002176278563657,0.01068968696713809,0 +rte,acc,0.51985559566787,0.030072723167317177,0 +sciq,acc,0.735,0.013963164754809946,0 +sciq,acc_norm,0.705,0.014428554438445517,0 +storycloze_2016,acc,0.6424371993586317,0.011083341168827792,0 +winogrande,acc,0.5138121546961326,0.014047122916440412,0 diff --git a/4b284b1b9c4seed2/evaluation/rankeval/4b284b1b9c4seed2_1.json b/4b284b1b9c4seed2/evaluation/rankeval/4b284b1b9c4seed2_1.json new file mode 100644 index 0000000000000000000000000000000000000000..1ce275822c383979695d05456d9f62a7ca8b95c5 --- /dev/null +++ b/4b284b1b9c4seed2/evaluation/rankeval/4b284b1b9c4seed2_1.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.323, + "acc_stderr": 0.014794927843348633 + }, + "anli_r2": { + "acc": 0.364, + "acc_stderr": 0.015222868840522024 + }, + "anli_r3": { + "acc": 0.3375, + "acc_stderr": 0.013655897185463655 + }, + "cb": { + "acc": 0.5178571428571429, + "acc_stderr": 0.06737697508644648, + "f1": 0.3525733525733525 + }, + "copa": { + "acc": 0.65, + "acc_stderr": 0.047937248544110196 + }, + "hellaswag": { + "acc": 0.3941445927106154, + "acc_stderr": 0.004876674814874709, + "acc_norm": 0.48645688109938257, + "acc_norm_stderr": 0.004987950663406552 + }, + "rte": { + "acc": 0.51985559566787, + "acc_stderr": 0.030072723167317177 + }, + "winogrande": { + "acc": 0.5138121546961326, + "acc_stderr": 0.014047122916440412 + }, + "storycloze_2016": { + "acc": 0.6424371993586317, + "acc_stderr": 0.011083341168827792 + }, + "boolq": { + "acc": 0.5, + "acc_stderr": 0.008745054976398168 + }, + "arc_easy": { + "acc": 0.5071548821548821, + "acc_stderr": 0.01025873302244637, + "acc_norm": 0.4650673400673401, + "acc_norm_stderr": 0.010234713052723658 + }, + "arc_challenge": { + "acc": 0.23976109215017063, + "acc_stderr": 0.012476304127453947, + "acc_norm": 0.257679180887372, + "acc_norm_stderr": 0.0127807705627684 + }, + "sciq": { + "acc": 0.735, + "acc_stderr": 0.013963164754809946, + "acc_norm": 0.705, + "acc_norm_stderr": 0.014428554438445517 + }, + "piqa": { + "acc": 0.7023939064200218, + "acc_stderr": 0.010667353792388213, + "acc_norm": 0.7002176278563657, + "acc_norm_stderr": 0.01068968696713809 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b1b9c4seed2/evaluation/rankeval/4b284b1b9c4seed2_2.csv b/4b284b1b9c4seed2/evaluation/rankeval/4b284b1b9c4seed2_2.csv new file mode 100644 index 0000000000000000000000000000000000000000..ee27741a51181f3c259da56c7e2b46f0867247fd --- /dev/null +++ b/4b284b1b9c4seed2/evaluation/rankeval/4b284b1b9c4seed2_2.csv @@ -0,0 +1,21 @@ +task,metric,value,err,version +anli_r1,acc,0.338,0.014965960710224482,0 +anli_r2,acc,0.371,0.015283736211823188,0 +anli_r3,acc,0.3416666666666667,0.013696658778002514,0 +arc_challenge,acc,0.23976109215017063,0.012476304127453946,0 +arc_challenge,acc_norm,0.26706484641638223,0.012928933196496352,0 +arc_easy,acc,0.49284511784511786,0.01025873302244637,0 +arc_easy,acc_norm,0.47685185185185186,0.010248782484554474,0 +boolq,acc,0.5137614678899083,0.008741742106878655,1 +cb,acc,0.5,0.06741998624632421,1 +cb,f1,0.3419913419913419,,1 +copa,acc,0.65,0.047937248544110196,0 +hellaswag,acc,0.3921529575781717,0.004872326888655522,0 +hellaswag,acc_norm,0.4898426608245369,0.004988751698341149,0 +piqa,acc,0.705658324265506,0.0106333114703475,0 +piqa,acc_norm,0.7040261153427638,0.010650414317148131,0 +rte,acc,0.5776173285198556,0.029731622646495887,0 +sciq,acc,0.749,0.013718133516888923,0 +sciq,acc_norm,0.74,0.013877773329774166,0 +storycloze_2016,acc,0.6467129877071085,0.011053474766125627,0 +winogrande,acc,0.5209155485398579,0.014040185494212949,0 diff --git a/4b284b1b9c4seed2/evaluation/rankeval/4b284b1b9c4seed2_2.json b/4b284b1b9c4seed2/evaluation/rankeval/4b284b1b9c4seed2_2.json new file mode 100644 index 0000000000000000000000000000000000000000..d02f632be238325f640f1b7fe4ad23e7e4f438b0 --- /dev/null +++ b/4b284b1b9c4seed2/evaluation/rankeval/4b284b1b9c4seed2_2.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.338, + "acc_stderr": 0.014965960710224482 + }, + "anli_r2": { + "acc": 0.371, + "acc_stderr": 0.015283736211823188 + }, + "anli_r3": { + "acc": 0.3416666666666667, + "acc_stderr": 0.013696658778002514 + }, + "cb": { + "acc": 0.5, + "acc_stderr": 0.06741998624632421, + "f1": 0.3419913419913419 + }, + "copa": { + "acc": 0.65, + "acc_stderr": 0.047937248544110196 + }, + "hellaswag": { + "acc": 0.3921529575781717, + "acc_stderr": 0.004872326888655522, + "acc_norm": 0.4898426608245369, + "acc_norm_stderr": 0.004988751698341149 + }, + "rte": { + "acc": 0.5776173285198556, + "acc_stderr": 0.029731622646495887 + }, + "winogrande": { + "acc": 0.5209155485398579, + "acc_stderr": 0.014040185494212949 + }, + "storycloze_2016": { + "acc": 0.6467129877071085, + "acc_stderr": 0.011053474766125627 + }, + "boolq": { + "acc": 0.5137614678899083, + "acc_stderr": 0.008741742106878655 + }, + "arc_easy": { + "acc": 0.49284511784511786, + "acc_stderr": 0.01025873302244637, + "acc_norm": 0.47685185185185186, + "acc_norm_stderr": 0.010248782484554474 + }, + "arc_challenge": { + "acc": 0.23976109215017063, + "acc_stderr": 0.012476304127453946, + "acc_norm": 0.26706484641638223, + "acc_norm_stderr": 0.012928933196496352 + }, + "sciq": { + "acc": 0.749, + "acc_stderr": 0.013718133516888923, + "acc_norm": 0.74, + "acc_norm_stderr": 0.013877773329774166 + }, + "piqa": { + "acc": 0.705658324265506, + "acc_stderr": 0.0106333114703475, + "acc_norm": 0.7040261153427638, + "acc_norm_stderr": 0.010650414317148131 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b1b9c4seed2/evaluation/rankeval/4b284b1b9c4seed2_3.csv b/4b284b1b9c4seed2/evaluation/rankeval/4b284b1b9c4seed2_3.csv new file mode 100644 index 0000000000000000000000000000000000000000..c5794254b8de3239a57930cc5a49cce405082ab9 --- /dev/null +++ b/4b284b1b9c4seed2/evaluation/rankeval/4b284b1b9c4seed2_3.csv @@ -0,0 +1,21 @@ +task,metric,value,err,version +anli_r1,acc,0.349,0.015080663991563097,0 +anli_r2,acc,0.359,0.015177264224798596,0 +anli_r3,acc,0.365,0.01390348598141358,0 +arc_challenge,acc,0.23122866894197952,0.01232085883477228,0 +arc_challenge,acc_norm,0.257679180887372,0.0127807705627684,0 +arc_easy,acc,0.4890572390572391,0.010257326131172879,0 +arc_easy,acc_norm,0.4701178451178451,0.01024144432288643,0 +boolq,acc,0.5336391437308868,0.00872524086113114,1 +cb,acc,0.5178571428571429,0.06737697508644648,1 +cb,f1,0.327692720923986,,1 +copa,acc,0.67,0.04725815626252607,0 +hellaswag,acc,0.39404501095399325,0.004876459434619795,0 +hellaswag,acc_norm,0.4907388966341366,0.0049889254105227685,0 +piqa,acc,0.6920565832426551,0.010770892367463685,0 +piqa,acc_norm,0.705658324265506,0.01063331147034751,0 +rte,acc,0.5234657039711191,0.03006330041190266,0 +sciq,acc,0.756,0.013588548437881423,0 +sciq,acc_norm,0.734,0.013979965645145143,0 +storycloze_2016,acc,0.6445750935328701,0.011068528452399879,0 +winogrande,acc,0.5098658247829518,0.014049749833367592,0 diff --git a/4b284b1b9c4seed2/evaluation/rankeval/4b284b1b9c4seed2_3.json b/4b284b1b9c4seed2/evaluation/rankeval/4b284b1b9c4seed2_3.json new file mode 100644 index 0000000000000000000000000000000000000000..ccd53a8f2ea4ac7ecae2d1fddac0e0095ed6704a --- /dev/null +++ b/4b284b1b9c4seed2/evaluation/rankeval/4b284b1b9c4seed2_3.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.349, + "acc_stderr": 0.015080663991563097 + }, + "anli_r2": { + "acc": 0.359, + "acc_stderr": 0.015177264224798596 + }, + "anli_r3": { + "acc": 0.365, + "acc_stderr": 0.01390348598141358 + }, + "cb": { + "acc": 0.5178571428571429, + "acc_stderr": 0.06737697508644648, + "f1": 0.327692720923986 + }, + "copa": { + "acc": 0.67, + "acc_stderr": 0.04725815626252607 + }, + "hellaswag": { + "acc": 0.39404501095399325, + "acc_stderr": 0.004876459434619795, + "acc_norm": 0.4907388966341366, + "acc_norm_stderr": 0.0049889254105227685 + }, + "rte": { + "acc": 0.5234657039711191, + "acc_stderr": 0.03006330041190266 + }, + "winogrande": { + "acc": 0.5098658247829518, + "acc_stderr": 0.014049749833367592 + }, + "storycloze_2016": { + "acc": 0.6445750935328701, + "acc_stderr": 0.011068528452399879 + }, + "boolq": { + "acc": 0.5336391437308868, + "acc_stderr": 0.00872524086113114 + }, + "arc_easy": { + "acc": 0.4890572390572391, + "acc_stderr": 0.010257326131172879, + "acc_norm": 0.4701178451178451, + "acc_norm_stderr": 0.01024144432288643 + }, + "arc_challenge": { + "acc": 0.23122866894197952, + "acc_stderr": 0.01232085883477228, + "acc_norm": 0.257679180887372, + "acc_norm_stderr": 0.0127807705627684 + }, + "sciq": { + "acc": 0.756, + "acc_stderr": 0.013588548437881423, + "acc_norm": 0.734, + "acc_norm_stderr": 0.013979965645145143 + }, + "piqa": { + "acc": 0.6920565832426551, + "acc_stderr": 0.010770892367463685, + "acc_norm": 0.705658324265506, + "acc_norm_stderr": 0.01063331147034751 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b1b9c4seed2/evaluation/rankeval/4b284b1b9c4seed2_4.csv b/4b284b1b9c4seed2/evaluation/rankeval/4b284b1b9c4seed2_4.csv new file mode 100644 index 0000000000000000000000000000000000000000..f899e9368b22e5ff32290ad59e8eb62d49fc245e --- /dev/null +++ b/4b284b1b9c4seed2/evaluation/rankeval/4b284b1b9c4seed2_4.csv @@ -0,0 +1,21 @@ +task,metric,value,err,version +anli_r1,acc,0.356,0.01514904265930663,0 +anli_r2,acc,0.363,0.015213890444671285,0 +anli_r3,acc,0.3625,0.01388303787422552,0 +arc_challenge,acc,0.2363481228668942,0.012414960524301836,0 +arc_challenge,acc_norm,0.26706484641638223,0.012928933196496357,0 +arc_easy,acc,0.4852693602693603,0.010255329977562098,0 +arc_easy,acc_norm,0.47769360269360267,0.01024956840455565,0 +boolq,acc,0.5339449541284403,0.008724878548525217,1 +cb,acc,0.5,0.06741998624632421,1 +cb,f1,0.3261261261261261,,1 +copa,acc,0.65,0.047937248544110196,0 +hellaswag,acc,0.39075881298546106,0.0048692327581033226,0 +hellaswag,acc_norm,0.4880501892053376,0.004988356146499007,0 +piqa,acc,0.6996735582154516,0.010695225308183133,0 +piqa,acc_norm,0.6926006528835691,0.010765602506939061,0 +rte,acc,0.5090252707581228,0.030091559826331334,0 +sciq,acc,0.763,0.01345407046257795,0 +sciq,acc_norm,0.733,0.013996674851796275,0 +storycloze_2016,acc,0.6461785141635489,0.011057260832171067,0 +winogrande,acc,0.5153906866614049,0.014045826789783663,0 diff --git a/4b284b1b9c4seed2/evaluation/rankeval/4b284b1b9c4seed2_4.json b/4b284b1b9c4seed2/evaluation/rankeval/4b284b1b9c4seed2_4.json new file mode 100644 index 0000000000000000000000000000000000000000..2ec9c28ce00a442824a9847009d0a9ac04297b80 --- /dev/null +++ b/4b284b1b9c4seed2/evaluation/rankeval/4b284b1b9c4seed2_4.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.356, + "acc_stderr": 0.01514904265930663 + }, + "anli_r2": { + "acc": 0.363, + "acc_stderr": 0.015213890444671285 + }, + "anli_r3": { + "acc": 0.3625, + "acc_stderr": 0.01388303787422552 + }, + "cb": { + "acc": 0.5, + "acc_stderr": 0.06741998624632421, + "f1": 0.3261261261261261 + }, + "copa": { + "acc": 0.65, + "acc_stderr": 0.047937248544110196 + }, + "hellaswag": { + "acc": 0.39075881298546106, + "acc_stderr": 0.0048692327581033226, + "acc_norm": 0.4880501892053376, + "acc_norm_stderr": 0.004988356146499007 + }, + "rte": { + "acc": 0.5090252707581228, + "acc_stderr": 0.030091559826331334 + }, + "winogrande": { + "acc": 0.5153906866614049, + "acc_stderr": 0.014045826789783663 + }, + "storycloze_2016": { + "acc": 0.6461785141635489, + "acc_stderr": 0.011057260832171067 + }, + "boolq": { + "acc": 0.5339449541284403, + "acc_stderr": 0.008724878548525217 + }, + "arc_easy": { + "acc": 0.4852693602693603, + "acc_stderr": 0.010255329977562098, + "acc_norm": 0.47769360269360267, + "acc_norm_stderr": 0.01024956840455565 + }, + "arc_challenge": { + "acc": 0.2363481228668942, + "acc_stderr": 0.012414960524301836, + "acc_norm": 0.26706484641638223, + "acc_norm_stderr": 0.012928933196496357 + }, + "sciq": { + "acc": 0.763, + "acc_stderr": 0.01345407046257795, + "acc_norm": 0.733, + "acc_norm_stderr": 0.013996674851796275 + }, + "piqa": { + "acc": 0.6996735582154516, + "acc_stderr": 0.010695225308183133, + "acc_norm": 0.6926006528835691, + "acc_norm_stderr": 0.010765602506939061 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b1b9c4seed2/evaluation/rankeval/4b284b1b9c4seed2_5.csv b/4b284b1b9c4seed2/evaluation/rankeval/4b284b1b9c4seed2_5.csv new file mode 100644 index 0000000000000000000000000000000000000000..36cdf43b0b71f617c17f93a9d4dba2b751de2cdb --- /dev/null +++ b/4b284b1b9c4seed2/evaluation/rankeval/4b284b1b9c4seed2_5.csv @@ -0,0 +1,21 @@ +task,metric,value,err,version +anli_r1,acc,0.364,0.01522286884052202,0 +anli_r2,acc,0.348,0.01507060460376841,0 +anli_r3,acc,0.3566666666666667,0.013833742805050715,0 +arc_challenge,acc,0.2363481228668942,0.012414960524301842,0 +arc_challenge,acc_norm,0.2696245733788396,0.012968040686869148,0 +arc_easy,acc,0.4831649831649832,0.010253966261288895,0 +arc_easy,acc_norm,0.4734848484848485,0.010245347015573706,0 +boolq,acc,0.537308868501529,0.00872067560638845,1 +cb,acc,0.5357142857142857,0.06724777654937658,1 +cb,f1,0.3263888888888889,,1 +copa,acc,0.64,0.04824181513244218,0 +hellaswag,acc,0.3935471021708823,0.004875379352079819,0 +hellaswag,acc_norm,0.4924317864967138,0.00498920977074323,0 +piqa,acc,0.7007616974972797,0.01068413067313458,0 +piqa,acc_norm,0.6931447225244831,0.010760295070580381,0 +rte,acc,0.5667870036101083,0.029826764082138277,0 +sciq,acc,0.761,0.013493000446937587,0 +sciq,acc_norm,0.749,0.01371813351688892,0 +storycloze_2016,acc,0.6493853554249065,0.011034317290463294,0 +winogrande,acc,0.5153906866614049,0.01404582678978366,0 diff --git a/4b284b1b9c4seed2/evaluation/rankeval/4b284b1b9c4seed2_5.json b/4b284b1b9c4seed2/evaluation/rankeval/4b284b1b9c4seed2_5.json new file mode 100644 index 0000000000000000000000000000000000000000..ebb6e324934445ccc69b61aa3b25f2305d745da3 --- /dev/null +++ b/4b284b1b9c4seed2/evaluation/rankeval/4b284b1b9c4seed2_5.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.364, + "acc_stderr": 0.01522286884052202 + }, + "anli_r2": { + "acc": 0.348, + "acc_stderr": 0.01507060460376841 + }, + "anli_r3": { + "acc": 0.3566666666666667, + "acc_stderr": 0.013833742805050715 + }, + "cb": { + "acc": 0.5357142857142857, + "acc_stderr": 0.06724777654937658, + "f1": 0.3263888888888889 + }, + "copa": { + "acc": 0.64, + "acc_stderr": 0.04824181513244218 + }, + "hellaswag": { + "acc": 0.3935471021708823, + "acc_stderr": 0.004875379352079819, + "acc_norm": 0.4924317864967138, + "acc_norm_stderr": 0.00498920977074323 + }, + "rte": { + "acc": 0.5667870036101083, + "acc_stderr": 0.029826764082138277 + }, + "winogrande": { + "acc": 0.5153906866614049, + "acc_stderr": 0.01404582678978366 + }, + "storycloze_2016": { + "acc": 0.6493853554249065, + "acc_stderr": 0.011034317290463294 + }, + "boolq": { + "acc": 0.537308868501529, + "acc_stderr": 0.00872067560638845 + }, + "arc_easy": { + "acc": 0.4831649831649832, + "acc_stderr": 0.010253966261288895, + "acc_norm": 0.4734848484848485, + "acc_norm_stderr": 0.010245347015573706 + }, + "arc_challenge": { + "acc": 0.2363481228668942, + "acc_stderr": 0.012414960524301842, + "acc_norm": 0.2696245733788396, + "acc_norm_stderr": 0.012968040686869148 + }, + "sciq": { + "acc": 0.761, + "acc_stderr": 0.013493000446937587, + "acc_norm": 0.749, + "acc_norm_stderr": 0.01371813351688892 + }, + "piqa": { + "acc": 0.7007616974972797, + "acc_stderr": 0.01068413067313458, + "acc_norm": 0.6931447225244831, + "acc_norm_stderr": 0.010760295070580381 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3f87c6741a9890eaa10f9abe42b4d49fe0938d23 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:714f22235056b85f66c2d163cbecc7cb0cc7b3a2f9dcee7047418fdc9ba68b3a +size 199058647 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_0_mp_rank_01_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_0_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3123ee37c674dbde5a53efcbf3c2dd4c5c36b558 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_0_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca6d15018448635c761f050c60a024ba7c31a640c76327a7bab6287ab392510a +size 199058647 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..645b19e9c0ee32d77b6043756c15ce7b47cd2c2c --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:89ccaaf180334848266b7c1d0396c60713da1fb91d717db780d4303ce75a40bb +size 199058733 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_100_mp_rank_01_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_100_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4b03dfe6f09599fdc08369618b7e7a6cd0e5660c --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_100_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e92ffb41a767a8235385ff425c907651ab0696906574f1e018009a36ec578b32 +size 199058733 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f81966bf280bcec6194cea11f75cca9f762973cc --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:af176695ca7f377cf090a73274d4a97c8bf191fb5934e24337887bc720abd624 +size 199058797 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_101_mp_rank_01_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_101_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dae0866024210d8777c01760cd76a9bd756bf2d3 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_101_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a83bbd615ca8b78623b2e89594496c9633329e6d985c6183b04bf2273d7f3111 +size 199058797 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..770871c8aeae670a7a539a3c65dec436a271e3f6 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d40835bf02a6d171d04c7af942ddc870158c7a7d3aa4249016519ae6ba3bfba3 +size 199058733 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_102_mp_rank_01_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_102_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c516937116a0d6fe4342208dc32f0226c691bfe7 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_102_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f74aa18643457ca2c732f30e2c3b8044ecae2c12a172486406e88cbe305e9082 +size 199058733 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b727b287260234aadedee0aa7ef66244d8e34ec8 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:978226cd59afa7fb11db47d9168096c490750175129f3a9860bf867b55a35d3a +size 199058733 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_103_mp_rank_01_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_103_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..100246cf49baecdf9d2be5597b53baa98e2c6b06 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_103_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c2096405a0ae8dc9188944138e59e21f7263618708266a886e91eada2aa0f130 +size 199058733 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1e24e6c7770833c85ccc207695e34613ac271926 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0d5b2f7c99ed2c6f1da9e5ebde0c0843a13179537c08ee41da47e27b4e804845 +size 199058797 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_104_mp_rank_01_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_104_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7f8d5bd60bc9e19611c32bf77f299ed2077b2e85 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_104_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:00fbcc8ab59076d1cb59efdfb10500995b0090894ada4cd03652fd5dda1aa291 +size 199058797 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..eb16f50b757d6bb13bd8b89d26a22eb4bd712925 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1eb5893a3e80fc16a29e95351a302fda809d9084a9bc81a467b23a896e6e673c +size 199058733 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_105_mp_rank_01_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_105_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..044541e5b7f3528d3cf7650040bc1c79557f678a --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_105_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dd5c5e13b24627c4bef4242273603ec87d93a61a3cace12fa60593c39af1ac36 +size 199058733 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..197f8cf741fee168406c0320bafdd64dae90411d --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bfc88f0c2ed04a441a0ed51f324a4786e1afe0c08be84e24a073415edabd04bf +size 199058669 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_106_mp_rank_01_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_106_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9f11a4bca2ab500f940b74f86fde46d241f42ada --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_106_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:10e16adc9075129d2bcc3fb4bed125356d5fb558af2c6bf76822fccc11327e3e +size 199058669 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2db1a836a7d58121fe24d572bb85e8f83063845d --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:91576b190a892eeaf41bf2805335c93cbf4c8ae6d8f9685585e85525ba317a0e +size 199058797 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_107_mp_rank_01_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_107_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a53547b68720378c97c25977d02d47b76bb7c18f --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_107_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a75d96f8cab5bb76a004de01faca63e743edf6099b4b8219f007aec1d839ffd7 +size 199058797 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6e66315469212770f379c95288d3992064052d11 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c974fade5293fb148db159390472c3a296077fac7d76286ea423d61309be89e5 +size 199058733 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_108_mp_rank_01_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_108_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8ae6b41ae8bbd5fa820e7580fb6258bbeec16662 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_108_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:25a73541bbf5cdc6c54899bef48a28daa00ecca8e349462e505d91cccfc2b03b +size 199058733 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e58eb8e21660e25e745686c0e7d33c32f9531074 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f0c9e5e1012776cfee031377f3303a9659a85ca90c0144bc1ee6d12ef9bb9779 +size 199058733 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_109_mp_rank_01_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_109_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ca417acb710fef2ca8a016c8fc48f2ae1bef1508 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_109_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca38db75529b43836b728ce5dc510eed45ed78e533e4388592319d3b241725b0 +size 199058733 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1f7295ea782fd8dd30e111e72517dd3641fce422 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a61e7075198707fff7a8cef4145cadb8748f7296876b8a97a9c11dd4317a87a6 +size 199058658 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_10_mp_rank_01_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_10_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9fde3ce009d7d5dcfbf4888445b7494a9791345a --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_10_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c7dbe989df6fcad79a08077aef1f608cda776a463cffdee4928757207c2bdbd3 +size 199058658 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e21820475e877d693982394785950f935dec6a48 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:26ac3d6a2e19442dba53dc33c359c6ce4021af42f44afad7969dff27b6f3d74f +size 199058733 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_110_mp_rank_01_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_110_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..30aed4180d790ebc36f4dae59611e559e3469346 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_110_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e7f7ca43ad8b3d1dc962d2e80d4f3ea9fed8f2ad12f72e5b93e8cea17df8b71d +size 199058733 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..40c777bd51897b6fbf10ca651d5620c3655f891b --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7184ab95f210462aa511f5dfa765895d3dd09c0736f9e90f152f3b8a76f0a14e +size 199058797 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_111_mp_rank_01_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_111_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..533af470e7031685952e4af1e355667684a1490c --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_111_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2ba2ec7666698fd136490fa497ad3355e586e1303bba4d01f62fdb6d181a90ef +size 199058797 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..63d8691e0e55f3c779846159769a6f70663130ef --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a04686bb673ae3dd30f45222213477646aa100cce3df8bc7c7f2dfb1c495775c +size 199058605 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_112_mp_rank_01_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_112_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ebcebf057cf6353432a9fe23daf4a4fa6a49f462 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_112_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:90fab4aff8e2d5b0a249b9d80a1b1a5f7b105b5a6bd5686e85aeb1b54c50dc93 +size 199058605 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b5b3df7e5e01586932e64fc32bf8b9ad869b3db0 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97fe7cc5d5dce56e8096ee721b9f9ed33c53fdee25389885a019673e4a4d6ae0 +size 199058669 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_113_mp_rank_01_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_113_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dfbe39e581573da982491f94144920eabd291cd5 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_113_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:72788296a74e50f6007b7ef3e402d8849fb619810b1b511523f86daf5e22222c +size 199058669 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c4ef8707e4dcc7c64e0cee382416099d6c9c3d50 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4fd14c60333e7863bde60da0bc94a751dd881ddfe685c1c7a02026e5d4522a0e +size 199058797 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_114_mp_rank_01_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_114_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bfda4ad77b7206b5a696130c40b0092bf1d820c5 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_114_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c92f6483dabc8dc9346ca1592dfb63ec1f3f99b350324b1eeba36c2a2113a14a +size 199058797 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b1a89024a49238ba204aa79a87c50980eae9cc4b --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:262d41acf25be31714c276cf7a6965b06dd1faad79ae27cdd5f9a53cca0817b8 +size 199058733 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_115_mp_rank_01_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_115_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ff22db6977a14e400770c298fd7cdd1e578825aa --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_115_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:053b57b04b00b1d5a5f9e4a6e7953c02df5f53116358e7d52df593c6a280b4b9 +size 199058733 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fc7c867c5dd92787e3b8333848b5aafd680e3ed5 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9591cd3f2b294e4de41ab3fd83e636d8e9647e2853850f6f0866e8c02951c65e +size 199058733 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_116_mp_rank_01_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_116_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..df0f5ecdf47e9107f3bff688c044c20822ad6b29 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_116_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d43dfb8d575ee8927663347e3ac09717d3e2dfa3d91883b7bbf709ef94e16a78 +size 199058733 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2e5415b3e841fa4d12d87bd3f4dded82dbd84444 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4493f9496070fca80084750b098be7db198bb2ad6661d444a4ec4b70bd1ba2c8 +size 199058733 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_117_mp_rank_01_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_117_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6d1aa358bfa287568dc75c5a7296fd2226f0fc2b --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_117_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8054e6092eca68e80d34e25184d2755cb04db9d1d7b188c9968414ab3e03b30d +size 199058733 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3a0c794256903fabe6e5318e8bf2745c63b33b3e --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cc68d7e98abc768152768c7e524846d7a324d5e6ed78ddcc0b8090991c3ad4d1 +size 199058797 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_118_mp_rank_01_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_118_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8304256c600368a3c86e86494e3d33ce6f4b979a --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_118_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:56c931a92636b4798a83c5f7c2c11a3cd6cd0b9414f887c4ec8e5e559844ab07 +size 199058797 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f2eb66f180deda166d0151a15f3dedc0c8a5659f --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e363f41d81cf4eeb5fc4b3c4c94cc93b4994ff7b7a68f605bb6ab762eb69ebc1 +size 199058669 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_119_mp_rank_01_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_119_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3b1ff0aba35a199223e91bb3fb1d64219e0dedd7 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_119_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dbe7d3ee06a6c8a74e82f64a389c80d943622f67cb0202ba99b4e52c73bed4fa +size 199058669 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4a7d19ecf418f3ac235460f41afde06817ff6b51 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:52fdbaf723b68ede35f5c1ebfaf4ad8f36a314efba44323941757f1938863bb5 +size 199058850 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_11_mp_rank_01_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_11_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..73fd2a074b186d6953f78abda16cb174b6a69aad --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_11_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8fa232575268b608f1d580e4159505798bf1ad92e2552b7b657db085271699b8 +size 199058850 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2558997c567487975575cefb2c289b286b9aec0f --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a9c13773e1944420f5892c64c0fec50b0a0597f2df7056fcb64801a1df185bfc +size 199058669 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_120_mp_rank_01_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_120_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ce0cffc66cc61a3732a793cee046538a67d7497b --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_120_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2618d605eaef1933959087f7d053e2aa9571a65d0d5af70e295e7bca9457c87b +size 199058669 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..260cb4ad44aef7c074daa3a91d8acab8ac214647 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:09e0e498267f6bd7e22b2e13aa534997161a8351fbb37dc3e8641cd76e262b8b +size 199058797 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_121_mp_rank_01_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_121_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f929dce2b95048074e5984750daec0f2ef890a81 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_121_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5aa8d5a9661ea26f9d7a7ee5e28ac43290cc9b057170ab2e810474dabbb63761 +size 199058797 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bab21ecc2206394f71511935ed257ab20f594eed --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0bbfa0adfbc4adedf14e9437bc65049faeabd158c862bd20cd79ab8ce2fb536d +size 199058733 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_122_mp_rank_01_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_122_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f58decac252a6c707940b93675b033b27d33c7da --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_122_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9ad8375bae832e29ae557813f4d5b7f3f62d9372b1f86e77b24e44c952bae33e +size 199058733 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..30405059903c8968735ac37a62a61b60dd417149 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3bca43bf9260dd2d4e09cbf4b2aa5650cedefc4cf50d80fc11d3ba1014e30536 +size 199058733 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_123_mp_rank_01_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_123_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..43a0b509b7300c5da41899a77e33e72a362d4f83 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_123_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:14c1a8c35067ecbddf3f64c6a32e533de8563b8df4e060c8bbbf7843e70b8738 +size 199058733 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1b521f7d65f55e7debdc06cfd4f89a3f466a6f28 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:083e73b1e6ac10b8714d4f34e201aa12deba924fdf564c9d9fc98b48fdbf5338 +size 199058669 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_124_mp_rank_01_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_124_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f33df540a2adfcae2cf0494f3c1200a2f5db35ae --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_124_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cce2ad11c856c058b7eef85c496d55e990ccb68c223514dbe96d2564e8f632d7 +size 199058669 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a784169de9ffc9baf4b755b15bcae67399127f8d --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8f281ba937423f19414c4b64e978c85558ec46f166e39f004f8a9f0a31b554bd +size 199058925 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_125_mp_rank_01_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_125_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e3e33a59a91a53bf92b2b3cf3a2a9ef840774372 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_125_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cbb8a2bce52894485bdf9f326140df53a3e22db9a32d71321f12fa3e091f5a73 +size 199058925 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8e7ab1791d2d4f7cbd6d1017b364cbc7319e317e --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c271f0bb10357183dbcc6ba9eeeb3854d6b13f8a1e8aea9c046187c71bde1feb +size 199058605 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_126_mp_rank_01_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_126_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..37fa0c2d8211373d6c56cbb61fc1db6f155a182a --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_126_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fe2f354892a55324b2a436bcc57ed7a802d9d09674a25f3c6c52798374272003 +size 199058605 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..77c5e07d312be746299dce87c0367a16a5845b3a --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0ad9337391d4c8f3d854b8f3280910d889c71d280a1d2fe17360a314e807de09 +size 199058605 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_127_mp_rank_01_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_127_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1475845c24d7f4946abc0f755d1cf79aeb489c71 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_127_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1bd18f2b8d9212547a72febdb3802dcb3e0ae7bee86d2bd5d28dad7960106239 +size 199058605 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..77a127a87aa9d86f7d41fb5632312bd891beaca7 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7389ec669fe74878bc2d9b21bfe06ea7989aa8e2138c0c727eab47653ffbd1dd +size 199058722 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_12_mp_rank_01_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_12_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2f5bc532b1cda687ceae17d4cd9030f672812f65 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_12_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e9960866be3e91c295747830eb1174c66a21bfcbc9143095b40e6e90c02e83f5 +size 199058722 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0fda27da432d227410989036638b219a52a4b17a --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:afbf39961a26444654d750519c4d104ba135726c9d875751959a6f87eb221f97 +size 199058658 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_13_mp_rank_01_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_13_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..887c4cb860889cdb87f3ec490f278debc842b34c --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_13_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:987be3ca59418f5bc2278b48093d59a5ef7354761d50e7e7e00850b46492f043 +size 199058658 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..45457f8595d61f0d01f6f02341e8ad30c4a6414b --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fd395c4d9ec4f211c3a69fe76df54e3c54aa993f3e554422cb136df00ec9120b +size 199058722 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_14_mp_rank_01_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_14_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b60ad3e161b27894ff78d79460a8f880c865210e --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_14_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:800fd79ee3c04ce60987f49b0508e0ca1bc307ecd0239da136c9483afe5e601c +size 199058722 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1756f4b74e3cf3b49d452eff28706de5aa59f709 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2fa7ef48fd1e9573322857915816e84131aab0dd11b0a3250c40328dc5095649 +size 199058658 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_15_mp_rank_01_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_15_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a2377cc674fd63a94a6a9c705029d1ec2be58d8f --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_15_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:45d0fddd9e9ae687a97d0028fd0a0231e93de6f53b76346adbfef3a16e51634e +size 199058658 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c9f5fd9b2f64642fcc2247b4d4ace505c7097d8b --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2d06b69f42d9ea4a382c35c5ccb860bae827fedcbfd7f8657689f54e5db39a4d +size 199058786 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_16_mp_rank_01_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_16_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2e384e1b5ad6120a4016a54f28552891a1b7259c --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_16_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6066a828124b2e9d60889d24036fcfc32eaaab72418d21cd7befed8ddd18f023 +size 199058786 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..79c67c0cdfaa2a55db9d99b568f566164736ec6d --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9f02198c16e739c797b2a4048416d0ce60c0251f503efc64915c84638478ce77 +size 199058658 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_17_mp_rank_01_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_17_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..856e99cc86a76600c034850c2489ba4aac3784a3 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_17_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ac0a81771ae747028bcda4702ce66b94be02424a3f47e78de32e77cf45d7b920 +size 199058658 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2a5a05c44e18e8c4ddb430470da859081581cafa --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2f220429c66b52d4971d5e72ea82b10a805915b1f91a27c07d9e72fe72af21cd +size 199058978 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_18_mp_rank_01_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_18_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7a25cd97e7f76deeda79a8503a252082d1b3329d --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_18_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c51d1a209721ed38bdcdcffc6f51e346efcf8b588073501c44f450eee179e780 +size 199058978 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..98676d357d004a409df6438affcd2830cf54ace3 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9f3efcb6ac9f1998635a54c7a74d8a9623752a9fd8c60687b1b96637b82ec4e8 +size 199058658 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_19_mp_rank_01_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_19_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..588b637f2cb3cadbae084608178bfa274d0e2e5b --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_19_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d9ae2f3afac50491cfab1539ee194b33def95255f8f147acb7f363f9987a421a +size 199058658 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..673e02473b2c4aebce4a9d790cb99861f67e3ee8 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:db58fc634f945762fb83c5d93956b742cb5d67ca17699d82e31f467ad1c47ece +size 199058647 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_1_mp_rank_01_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_1_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2405fd0e3e552cbc52279c64d5edaf52a9d4e39f --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_1_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5d998822dfb41fa82e2faf26e47622580434f20b13eec1eca2d07fc30a25ac77 +size 199058647 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4eecb7533c06d246c190b3be1d990a0efbe9d5af --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e2458c80dc19fabdac418e4199744404bc3443e90b4f69e388f16c6534f9dab +size 199058658 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_20_mp_rank_01_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_20_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..381b7db38a006396f3a77200f571340fb0e14a30 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_20_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0d02fb2573fc04b00af9ef8f25b656ccc0a93e776f34309a172dc5c063ccaf8a +size 199058658 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dcc7588bf015edeaefe116d2e0527318a7244c0e --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:49d91699bbe84dc5a9fec500dd7451e3150b53a1eb4231170139aa9e7a847f48 +size 199058722 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_21_mp_rank_01_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_21_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e155916461948f12351f79928c02e40151f4be9 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_21_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:703694ca085914e507802a2f5593953a09d971dc689817e7a7a35703c9792268 +size 199058722 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f79d81ad56e515c90c310498577ccfb68c1dddc3 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1fed6926ea386fa583535d73a8d62b2653dea6b54cfcbe3e307deb6210a51db7 +size 199058658 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_22_mp_rank_01_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_22_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5f7198bd4811a718b2e8a663b88ba4f5ca56ee56 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_22_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:608915e14a78e60e515de371bb74b9d691e789a98ecdb6b5e1aa354e87e5dc5a +size 199058658 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a392e6a0e563f8144a358e0ce7fdd70b5d96db52 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3dbae86fac58c5507eb0cdaac8b25ef42e4373890741131be981e4de2c3cd83 +size 199058786 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_23_mp_rank_01_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_23_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..504d7ea0f8f2f83d29b3e30041f5e3d04e28d738 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_23_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cc0e4edb4ec577a86fba01387ed9fb40ab271290a5b9cf49ff01d33ef15d502c +size 199058786 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..68db4245284add1ba42883b8983247b6fa766c1c --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e4a7fd795b217fe033efcd8bf15fb5ddda6d0bca0d8b8c1a7f3ddc67fe01d5fe +size 199058722 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_24_mp_rank_01_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_24_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bfc0c0183a55ffd5cd8b2b4d7cbaf60a42196de0 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_24_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d6357e38c7e2f056eed4de2d2a39a023e7786522ad21e76a22b47baa3a4e9430 +size 199058722 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0a3260fcb02a38ae75ee64346b7927ed31b4117b --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6a7aabf8ec123ed2b049db1dc301f82857c7e0a0c6e1846c319433d961bb951e +size 199058850 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_25_mp_rank_01_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_25_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fe1572ee104d0c8265cbe30fe3c788f96cdf17c5 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_25_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e714296e23f302b9a0ee5dacf537b71ee46fd94b7f3c2ba0e8b323f17040dc3 +size 199058850 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c8469fa06251758d2995fdcb65e3ba0edae14e6e --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:66d4ec63f2dc8d6553f9e891e9b98101c73c32fa6576172031f7c877900186ff +size 199058722 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_26_mp_rank_01_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_26_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4fb47ca7d89523dcc0064fb1cf6f4f8a598b0a9a --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_26_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2e9f01d3cd6896a1e9a4b4564331e6ecfb99578ba7408c9f419dbaabc4ade680 +size 199058722 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..88cc63b4ccf9f9037244c85977324d1a40888321 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f444fdb81c2585cc1dc3eb05373bcb5df6fa326e80320039210a09a2a997be47 +size 199058722 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_27_mp_rank_01_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_27_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6aaf56599f88cd38d6bb87262fd975bb68810bf0 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_27_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:28495bccabfbc0719fe89e30e9e1202bb45c69c20f3d9b46fbf449f7afa3aefa +size 199058722 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b7c242379dfc674817cdffb6739eac4a5111730d --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d323573236a90c06d28d651c9101b088e21df49aefe889c12d040b88ae19be1a +size 199058594 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_28_mp_rank_01_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_28_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..acb52eb540e97dad5429eb4d2126701628db2466 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_28_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b3ce256e0b1beeb9c72b9d7acb16aede2a25b1ff858a7b6a2cdf468f6d54433c +size 199058594 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2f34e210b966229c5ec6b3d9d602123a00e158fe --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca8b58d0fb22d31cf23fd14e1484ba394bcc827f51763e3a427cce75f7538131 +size 199058786 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_29_mp_rank_01_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_29_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a6eb7c197b53df4108e5e73dd84164dc9f9fc127 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_29_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e84bf144ece04fea595c9b2f948b5216f0ce47367d6ddd9bfc36708ed71cddbd +size 199058786 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b44622fc405c014f6f1a54d2d530c7ac5a12d924 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1c1bc5539ef9d687ef7af6ded85f9b535030d529a28e75af002b2116b8bd516e +size 199058711 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_2_mp_rank_01_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_2_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..36fe9e0d045c7e947e56341e18d91857d813a462 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_2_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5145922b9be9f120d96e4f7f2a7f9ea9661feaaa8d03361442b9695a2dd8d503 +size 199058711 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..11d385c65dbe8e6ef4aaa138b7bab7db3c26b310 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e8c01256eddee8bf26242893870b777e935dcc75e9c1fb2160b0c9cb5e7b081 +size 199058722 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_30_mp_rank_01_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_30_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7b961698f4a6557f86fc3eabd404e168a3abb52b --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_30_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5640b4a17f6a1aeb606dc6855710a23f5cd8f2bd5847f902cb2d958b8bf68afd +size 199058722 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bb618c38a2456859dad7a4c866aefffeff3b74b0 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:72b82f9b204dcb4cce1e3625fad96a7f8d3e34eb2069d8eaa1eeb26598c0f231 +size 199058722 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_31_mp_rank_01_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_31_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5a35423516a561fc01758ac7eadabf5cd8aed3c2 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_31_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:faf147d25b1bc972c1e6b585d3ab86bf98176746f81c2cdb25fc36acbf9fe917 +size 199058722 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1403c10da6b6b61263c323e48f234ad834057332 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bdefe623621f1d0b362bfc65317d9f948e49af2b49ea2bba8914744d343b7e4e +size 199058722 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_32_mp_rank_01_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_32_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1488aed934076747a573ff5ec9a2ce2e0eb47628 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_32_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3e9134d60fd053da133c987b973d5746482c7048eef140c175ac99d48181e88 +size 199058722 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0cb834538999df9995a57e752ff188b3b1aba03d --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8d267202de9d8488ddc0111d6a6eba5f0b9b52eed61213221d8c27428c3d9aae +size 199058722 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_33_mp_rank_01_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_33_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..98b5ae321da7cc99e1b3304709ff8c9b6b7e4598 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_33_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a713f440b06295f9eff9bf01cefe48902e9faa7911df55a31e740729f893f449 +size 199058722 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5926a4d3bc7d589a360f060e90ead02915ebec61 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:795bbe83dd5bf8c19a4d9ae1f731306e4360fa7b11158b0a26e4afcab129f9d1 +size 199058722 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_34_mp_rank_01_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_34_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2ece91f6f37c51ba3d0f6357f1f0cdf7b9b442fb --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_34_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5ff9f5868ca30114a38c412cf5232cfea212460186f8e949531d9d4f7b673c67 +size 199058722 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f2bcefc8cc949bb615466030eb9156e7adf95717 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bf9f6f687dfe6bcf936b912d059415ae84758896eb130fd69b58d9d1bf2d1cce +size 199058594 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_35_mp_rank_01_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_35_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b1acc0b409ae5e8a01454edf6961fde1dd767fd5 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_35_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:87262f31e49060fe4d6321828db0c825504a3e5a2c2ad7edde8047418757c482 +size 199058594 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b5afebc7ea75d47947ff0277f6f979b5f784ef95 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0a10ffe68b5822b86d25c15c4a9a2b47a0825e36a29dfb3e3169593849a37522 +size 199058722 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_36_mp_rank_01_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_36_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ac71299b5d9db7d58000aa19142c9a7c2c13e977 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_36_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ab8caf5129cfa68857eb6bda8450b84c3e004a600ee2ca8d215d22db15ab3635 +size 199058722 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6c2b2f65599516d7a64410a1ffe55e6cf91ab00f --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5ef981a21b2b3a8071594e375879562a5966ca8f44028eb8efff5235db73dd33 +size 199058786 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_37_mp_rank_01_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_37_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1b6bc67416b96b6cf93fe4d9c8af64502dc3d738 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_37_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:62498914429ff71968bf752b647bb27019fa4f71c6c7d6de1c77fa9c755d8bdd +size 199058786 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bd98e5f31132f63d026b3bf1b4268747f3890683 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6313fa471c947bc558fb698f3f3b49fcda7bccab03bb1f13c1e4ca6c738515a4 +size 199058850 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_38_mp_rank_01_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_38_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..28dd0cb5f5859c14fb86261ffbc6a84a7f04135c --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_38_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d78fc808cd5a7661a731dd0774a24877118b461182613bfa1087f33906ac901a +size 199058850 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6affde196fc1d1e3cb07d84279d7855319dff215 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1bd8ba9323ff4cb7c47eb1e68bda5e66ddf0da54f469c4a508ba270bb7f085b0 +size 199058658 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_39_mp_rank_01_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_39_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d3dd4f8dd49d0abca5e86a10d4d16a75e926b816 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_39_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dace622bfeee5aff0a1d38aaa35338fe0be958633547cc08edfb91309b540b1d +size 199058658 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f51d79b306458c3fa369d018e43db07fd2bbdf54 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bf3ff71d67911e34d63fc8c6bfdaae57f582c9c00aa21f9e6aecdc8de170d202 +size 199058647 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_3_mp_rank_01_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_3_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e0440c41e36aec1c2b3866342f76e43e463b915b --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_3_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c39689a0ae28d768e943b5a50fb65f84391693cf066769609f0c3b018dc971a +size 199058647 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4cccea7dd3db1a709e3bbccf636453e01b77b8a9 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d563c3324d0e137f6c79a70023be740238b581d7260a78398ed23083678cfc90 +size 199058722 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_40_mp_rank_01_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_40_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7cbae680a1b9f214e8b6d49e2df01d86cf829c33 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_40_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f08a8c575df561a4a33b15089d06c632e35faf115f197d97ae4fa6b475cf2c66 +size 199058722 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c564fd94639a6eb8379f5e67e041c22a8c41708d --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:36a9492f66170ff71880fb816ffb1171a079df551e06d910ff23ff11c4dc9ead +size 199058658 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_41_mp_rank_01_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_41_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0309d3a70be05c99e8230ffc19ec4c51d2d4db38 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_41_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3333ef84dc2b56cc411075a6566b3656d54da9648c49cb2b6d8d2a19cf774331 +size 199058658 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..844c41608300fe858011c7f1522834cebea59a33 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:81bf4446c3df715ab7f14863e09ee7ac8c1989e555293a562eda39964d2565a4 +size 199058658 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_42_mp_rank_01_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_42_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3540b7cf33723e1b8bfd0344b970d9d1118d4758 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_42_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:31bc32ac570705652e0ce7f1dd1c619501a5585ad4f308772a527555da55576a +size 199058658 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a9b3f4eb3f7074be5d09fccf8d20f7feca1bbb60 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1f82590576d952d497e82ac4e4fafc977a37a8cb117768b769b0cf04a4a9b11f +size 199058722 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_43_mp_rank_01_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_43_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..74c9e065cafccea6e00c9edc325cb2d15355722b --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_43_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d0ba9e5897e1fc061f6684f5d10fd330e91e6e395fdce79e0df575e50ae4abf7 +size 199058722 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1e74c28c6ba188cb58643d286b33fea8ada8c828 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c956f11d1471e7f54ba35e2e1cd5f588feaeb9c28bf36cfd2be63b43189e5c7c +size 199058850 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_44_mp_rank_01_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_44_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7fd3fa169aa41354d20347f6eb9cb2556cacdd66 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_44_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:67dbe06f5ab2e7fc4784408a400ab9956bf7af61342b05463eaea1aadeb0238f +size 199058850 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d933a11911997738a0f87e6a8fc67174ff482c7d --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:844b4bd18cc7c164b2eaea9ee85660df0770d25d80a0ea920ca1a59a00162def +size 199058722 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_45_mp_rank_01_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_45_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c00734ba1249decf6f930d603fad43045f858f16 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_45_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:66a6d4e8fe2968d40ce4b22ae6cdef8998420d61f4e787190301cf5e835a4930 +size 199058722 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1a24a315fb55c46c89de3935bbc0c10f5c68bfc6 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e5c32db96956da39cecc06f0c188bf862e63edba1d09a0c129369f731846fe0b +size 199058658 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_46_mp_rank_01_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_46_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..278c29d09bf1ff797502636b8f33fa389aa3bd52 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_46_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:85d4f25163fb46f03e89e68e7d70c5d6ec25465ba1d714ec17fad205b6d58469 +size 199058658 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..13831344be1671feda8813343d51463078448cdb --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c0377a9cabcbd5afd715db18d71c1524bfdf8353986c65c85a5dbc2459a13cc1 +size 199058722 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_47_mp_rank_01_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_47_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9611212313210f3db9ed4976ffccdebaa755eae9 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_47_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f695ca9639f16442254d9ae792f17475797246ca1a5e6118456f9d929c3dcc4a +size 199058722 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f8e744e34e58e39976592dbe296b53306b26eff6 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7da02b46d17e4719b27a1db0e4b3387ea121de2a47d7ab8715aecf7ee5c5a558 +size 199058658 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_48_mp_rank_01_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_48_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..39cac173a9f3d63cf29e3f2239b02445c218b712 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_48_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5df49a55a5191afb8ce35a61243bddcc0ed4b3e0738a8ad7f1ffad4aadb6da42 +size 199058658 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..637d74913c401d14d2f1d07f21e9824fea22604f --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e5e1c4f8e984f62448dc8e33931ca9b7ff5b1f3723ca4ac5977bdcf42f1bc293 +size 199058658 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_49_mp_rank_01_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_49_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e98732e9099550af9f6aa4b471415f075035d149 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_49_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0a791ff611091dda47eaeef8d538e17095d50271b97dfafd3866b2061dae70ae +size 199058658 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fe4a10a7c1062a713e07533638ed42c29cb64287 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:78dd7b74e4ed6072f567ef4a4492ff077a133a145dbbfcc6179bf21e71a6235b +size 199058775 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_4_mp_rank_01_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_4_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a217ceccf50e2acdb04001ddea6abe32b9f81b7d --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_4_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d9bb38fddb9ce99bf901fa65092c576526ac0a1a612f36be5308b3c3c6f3ee78 +size 199058775 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6204aaee7cf6894b4f2aeb1a924462787714fd12 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cab5df7415a5ee90c6a70d2aa0ddf666bc742364ed666dec2a26a504de6bdaaf +size 199058722 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_50_mp_rank_01_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_50_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..46f92859e6711047c3114d206694b4a854f2a601 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_50_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7ac04a5cc6101c3cd328fa3d442795e92a849a0b9c615648503247f8959cc75c +size 199058722 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ee4cb4725b8cc079eeefa9240262c431d75124fb --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3e550008c110a3155a261dbbbee1fca79ae16a8a1e22b58d241ad34448b396d +size 199058850 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_51_mp_rank_01_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_51_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8c5da7c4f2b133773891c7d7a7f0a845400a4952 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_51_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0003041fd2c6e2bc2102f6618e25889830bfe584228db2d4e4b792c795d1e687 +size 199058850 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4e7eaea017aeb8b1ae4d056a41041e7e96e410b9 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:75d41629d8d625c445e70a7adab6fa95bd8d5dd83056c7f1686fd09659b62f6a +size 199058722 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_52_mp_rank_01_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_52_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a961d78ea124286a6ef2538278aa4068c9388da2 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_52_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3c84b94e2f93e6633111f05a813b8e233b4ff7efa4ad253e07a0fdb3bd572351 +size 199058722 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b0a1cd254fcfb72f423ba6c93672c5e1fe3315ac --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4f50d6a328d8c18b10440eefd6b9704e1c7e8bc665fca8be33498be5c3e585a2 +size 199058722 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_53_mp_rank_01_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_53_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..284113ca11192e99a423d3598f16cd1cb9fdd1fb --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_53_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7d000a7840ec09bcab8855a9027d6ba27119f4abdd9058e12ec953c04a8ebfa8 +size 199058722 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2c5ff32dd080889bf6a1fcff7a475c95fd989b7f --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3ccd0bd1b36e776f6a1425dbb18ea59d21988ec58a5cf3387e4893b9d5000586 +size 199058722 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_54_mp_rank_01_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_54_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b5d729ade6766de7c0d76def945c6ddbab7666cf --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_54_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2157976ea84319716d2254e3f50c537d77c17d9fe456a2afaaf4452b48cfcac7 +size 199058722 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4644d2eb2de708b322958913b84d251549967531 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eb88769419cae7eedcf01748253cec52fdbcf8dad3ae56a810e3951a121e2604 +size 199058658 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_55_mp_rank_01_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_55_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..313a5bf868b57d98f0cea114f616adcdd3a7402b --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_55_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3dc5c3daeca2a757c8fabf8df6102711c4445506c8a4d9537b3390e61c3a7860 +size 199058658 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b67cc031bd99046740b4b05e5308a3bdc929bc58 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eee94d9a10fd47c2df214e4c3fe057f159bbdcbe8e2b88903f30829e1e7f7d57 +size 199058722 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_56_mp_rank_01_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_56_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..146acba755d8c4a62b99baaafdce77f1d4c61f8c --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_56_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b69c11943b52a1d3e6b5e3a78c7545d26d9312f8d2df6d1b2113bdbeb0430011 +size 199058722 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..40871f440e0d2b38b96ea11cccd7ca917283983e --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3552365237a8f6300eeb1fa1c43b492c2a7e5dbc24863207263a29ccb7d28912 +size 199058658 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_57_mp_rank_01_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_57_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6df8acaf170edd37bb7f4780ee9562c991c99664 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_57_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:614c47220550961919c1fbbbd509c843d2bf30c26f2c336a8e01c6a76d8f5fa7 +size 199058658 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1242a977df9f02c3d8763fbf5ef3c5ae75cc2679 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d687a4c79f2fa61175a7d75a6f252fa5482d168d9f722ac74511729b9219b020 +size 199058914 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_58_mp_rank_01_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_58_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8cd46d62f2952f0c9165572c1b10b84b29d6aab7 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_58_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f5064cf6c6696374c196b81bb7f378151d63c1449b0618e7d8b9850057347827 +size 199058914 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ddb82dffa043653e33b0d867bda358e2d7d4e49e --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e9d341ba7c1e2786f0e20843d930a2b1547fe172e9de484a635339d0208f998 +size 199058658 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_59_mp_rank_01_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_59_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5ddf2be999292e88885f52594afd15343ab36278 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_59_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aa36c3afb0c37d672c955c809f65a8ff0b4d0ba7579096409fe97a7812217bbb +size 199058658 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fc8d6811ed78c80079105b540269c126f7999840 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8f11660b20d9b041557bc4a5132c6d07e06e5fe2668b0bfad03becf64bdf5d02 +size 199058711 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_5_mp_rank_01_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_5_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4c65bda14b3d5976f7cc713a9bae6f53c06daa82 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_5_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0e481e6648e3aaef34ca361d3de3bd3df4cc71b419e2922384d7a5733afda5b8 +size 199058711 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9903ee5a9695aa92c193fcb11281ed323dfd61c5 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:391f9c5813e24e322c5f534cbd98da1099b0ceefa2104f98eee55c06f81fb4d6 +size 199058722 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_60_mp_rank_01_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_60_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a8eee1d12bd58dc19079af0651dfb9774669ba2c --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_60_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:261853e8b0d7fc78004b6151b9eaacae6d2a93c266fc2e3663c70aaa238395d4 +size 199058722 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2553c7f0403cd7ba3a2ab76b611b46f2cbf98217 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b1fb1ba06e3be8580fd8d182da4a3117000abe87c6b6ee946929c77ebb0131cc +size 199058722 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_61_mp_rank_01_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_61_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..63938b83d118196a8d8ef31aa1bc0ba84be4ac1d --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_61_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a772be562981ecce77265aa4bf8c0eca07993da611eb61e4ff46018ee2f1e098 +size 199058722 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7b9143038689ca6c9be82cc2ad89e09f98f419d4 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7e14904fe54db5c0b78ae1c0b7f9ded40a9887c4b79f153fec68001d2c346846 +size 199058722 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_62_mp_rank_01_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_62_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..14ff49b6633811640f3ac7134a69b3b7343cf033 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_62_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:967a0d41de85e5c4df2c9cd535a8b74d0ae1684c3b183708fee2914cea01713a +size 199058722 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c6f97b58ae93e88114b4ab1b5d50296f972b1eb1 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf85bbc00f0e3b11c122b61d59ea06fab71766bd3c16837cb5c7036354c30f06 +size 199058658 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_63_mp_rank_01_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_63_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8e4ab4911459c03097899a1e80d7cbe997f130d8 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_63_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d83cae00ee72cc24d75c9af09c6d40d2630f0b87d0795d649d02f6886ca0a5d8 +size 199058658 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3fbe8e393e90f2b219e608e77dd71fe60ff88bc8 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f039e70e0c48cd15cf9fdc344e9fde3dc598fda59d2b7d583e30d61cfc7c1502 +size 199058658 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_64_mp_rank_01_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_64_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f57002e200736f24e8d650684f893c475092bdf1 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_64_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:42d5bce1baf128be840bb1923036ef18d457f2c57c9eafbaaf06f11d2a27e9a7 +size 199058658 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8cfa9c0c00e88cb0f1511e3615c66f3cba13c424 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:50ff2203c446a1fcf54e3ae181c83be0f4b86a387ce476a4b1e81fe404477ad5 +size 199058850 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_65_mp_rank_01_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_65_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..86fa6a5650f82d670577418e18ee3335b4abc4fe --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_65_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5a0a2c22069410cbee48d55261aeaaaa4fffeff52b1d3a98186311b5506013bb +size 199058850 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..685503b17e7128d8b9d47eacdf9d1d0cd404e1f3 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8db49321b6f9a1593d0c6f138dd173516289425edfe31e41e9c9028d03ee7769 +size 199058722 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_66_mp_rank_01_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_66_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..78d3fb3b66584a71635891443bd4cb3ccd7d85ec --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_66_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f4270076952512e2ef32ef91b0ec3ba144283b7f9c2089506cbd0fb237867e07 +size 199058722 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e5ac5c9334f3b34618f42ad5cac13821d652a1ec --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d1bac1bd783b3fe70845ae432390dd79f900f1f34f1ce75e30b7c5003ce021e1 +size 199058786 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_67_mp_rank_01_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_67_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..369d16f4f65853e51b39fadf19b3a4cefd1301dd --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_67_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aef4f1cba43e2206e6f1254813c318291b65ed598e816d4805748257e525f674 +size 199058786 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a71a1448dca215cb1d0fb8ed574c1bdf1956b546 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6cad0ea41459a0a38cee4dbe943bb2c24cb7928706f9b74e992425406cc4bc83 +size 199058658 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_68_mp_rank_01_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_68_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ffeec7539c8fe0ef2310f61853abc9f1515a0903 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_68_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:36a03ab0d979d8881253d59bdce005ecc4d5909759c3b1771fedc3ecd58374be +size 199058658 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1ec6842d0e1812f59723c322121f7fd4f3146819 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:457164c9f6f08e65a4cf518ba101f288239509a4b105fa5b2d4d53e6b34f5e11 +size 199058722 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_69_mp_rank_01_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_69_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f3874024ebf5deeadc22ad94e553f741b125fc78 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_69_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:920ddcdd2cdb83d5d2ea1827a9ca53c5bd4fb9a632efbeb472f10681ff601367 +size 199058722 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..179d0799e309860a49294ac8d53e60622a24e93a --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c685ee77d82131227bf9a7e645bf1725a60dc09b576257c91a5fc480c83e9ae5 +size 199058647 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_6_mp_rank_01_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_6_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..38b945d7703066280408bd5d7e0dbd556dd2a884 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_6_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:15caeb6973f539eaf27bc93f4a6b83e352f08b7645824cf96b4f46a5eb5000a1 +size 199058647 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6d7df46dfbc9d328c5fd7f5cf18752e8af68ac8f --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d3ec7a486b1a3f0c433be8588c7d17fcb86913d67319951aed45efa9fa3f858 +size 199058658 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_70_mp_rank_01_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_70_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..05a1a1ef94d0f20c9067ea22ba47cbb5c622d7bc --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_70_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bf6dca73942fc4b92afc2308d6322d9c6ad83d473eaa79151f046c784ab1e0c5 +size 199058658 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4a0fa9e4cbcf07d67aa2c7bbc0fdeaa513012fc3 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9eb84ad3b3a070515ab597e5aacbe1337838c3e693a4a32151956dde1c3cb246 +size 199058722 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_71_mp_rank_01_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_71_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..335a60f8d322b00eb99b3448e39d55b947fae2d2 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_71_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9d60276f180bbde61ce8029428b4f43288730917b2a9fd8ea7ee9d1a4edd591b +size 199058722 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fdc94897d2e8a4a29f6680b195a1e85a57ac01d4 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df1ed70374644070c5c6618da47e76497ad565e52eec4704a30a58008ab1e903 +size 199058786 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_72_mp_rank_01_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_72_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..feae7a23a848a9d35044eb5445989267b83ecf23 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_72_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2528761851c64e1b93b45529f3b15df750a4b7ef224e3f6d38ef29486f5cdec4 +size 199058786 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..27fbcb8fe47703997dac51690c549286c84f0186 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ed0be32fd069854b1eb6098da4d4cc422544d2792112da127dcd37bbdb291f5 +size 199058722 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_73_mp_rank_01_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_73_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..68aa286b4ac81ff6599d492fb4ac68facaafffe4 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_73_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6edf6a5e544efb54e7a6acf60347ec1d30bb4b1df388e8d3d6f4cb6557db45d6 +size 199058722 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7527802a5faaa8bf712120f4320862b761e6d20d --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:590722bfad7ff14ffdbbc02745874f8f190220e9992d96f6eea8b73e30ece837 +size 199058786 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_74_mp_rank_01_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_74_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9934b77349ef99f042040ef33d0961c65e55fef0 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_74_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8f9387f58694aa021c89618daf645ae9a8034be5543c4fd42bcc5fd51d0ac264 +size 199058786 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7b48f7ff76550d80302e1a18ab057e0a050a83b9 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:397c0fb2a82217c7f14859801af041e316f7996e5cc411ed33db17fdb6c1a10a +size 199058658 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_75_mp_rank_01_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_75_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cf979e64c03fb8f831bd7bc8f6ab827babf1f95e --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_75_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:949ac158ad8502f81860692aeb721178d54d2a1324cb6daeea6bcfbf2d40c1c8 +size 199058658 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..56654eae14ab5cec3da2b0d3c0684e1308e4f5d7 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c52ed0581cb0c0d5c0f3be882007bbd3f298f75c4ae7514080323efc6777ad14 +size 199058786 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_76_mp_rank_01_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_76_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..96dabfa5c769444a0312196f95f025dbe2fbf4b1 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_76_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:74a03b2069238c75c57001f862fdefff60cc6b3a07fb7488ff9119d8b002aac6 +size 199058786 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f087681886e391af1cfa8a0ba1409aaeaef0c5c0 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:538d361bfc7d9270153aae0d49e949fefb89a937ea534cece32b82e067332977 +size 199058658 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_77_mp_rank_01_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_77_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a7adb25fabbaf355b98283188eed06565070d35f --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_77_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2ebfa6762df4b183be4e8ee33b3767f6e3ba9e63f8f06f9d32438607362c5d75 +size 199058658 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..643cd1956761aefe37b9eba490ba73adec13dac0 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7f6fc84d54b7cde2573bc74c2ad9d2725676db78038ac4c0dbe986e413b19987 +size 199058786 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_78_mp_rank_01_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_78_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c34921ff154c2b9f6a46c6665215612aa3e64325 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_78_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b8bb05aa80598c520a2beeb64c2f8c73928d201ac2d22feccd4a4ab5a7fdef4 +size 199058786 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b6ead74f066b83efd1efd22920122ec304345555 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2c453d1391eebffd2ca3b6cc794a3bfbe4e8f47615e069664bc747fa0ba34510 +size 199058786 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_79_mp_rank_01_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_79_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7f62bd7b8633488abbe89fb9bff5e4f622bd1bf4 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_79_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7e3c83cd32a3bddd49d68c8aea1e2c8a81311614fea3bf82820bb3f4f84b01d4 +size 199058786 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..039fa4c3f2be148d6dbc8ef25eb662c5ce1c7cc4 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:31460cec7faad2216d6ddae9dcaab6dd359f2b285b3755dd3460f4e18d2f90a4 +size 199058647 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_7_mp_rank_01_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_7_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c8bea901191125fc2d6f7ad4a9fbe2cb84d78dd8 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_7_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0d63cc7b72fb1dff3912b66b2ecd7cd5616099b7997f3a6dcddaa0e96f5c4504 +size 199058647 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..305d12a77d50d63daa40e5cbd67b12598d57b61e --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5324ce58c0e494629985807796db2cea1d476a3ae37dcafc40bda65a63adf3eb +size 199058722 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_80_mp_rank_01_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_80_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b1ff0343b136ef06d844e3c4bedec6ae6bc1f64a --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_80_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:401bd36d391736a21276ddff96888a69a151924c25d9a0987948fdca6bf409a8 +size 199058722 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8cf5a35bb08c2dc90219e50d61d71ecf3a069dc4 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:93209e2cf62d771c2d2260e8fd527ef00ce36790d38a0d4227b0f4d5bacef13e +size 199058722 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_81_mp_rank_01_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_81_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3fa590d7252ef6b4d8e70226ee40effd7f20354f --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_81_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:656601dae90758abaa64e6b637299d9e247a92d3fd25b959b85c83d34707a000 +size 199058722 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0da25151b7a50cd7812910336b3517354e430dc9 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:99e061d7332c67a9565abc117924f9b80f1bf2d398d2fcf49509411e8806d9f1 +size 199058658 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_82_mp_rank_01_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_82_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..51bd312469a82aeb05c76b53ccce1b077336e7f3 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_82_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4746f29b0b53302ddb7e6386d31c88e8c273ce536d7483471bf45ad19cd2a8e9 +size 199058658 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fb9a56739ed795cfc55b501abb311368d6ddb52b --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b7514d8f60d171fded9d96f13038ef735176c1828bdd5148576955502e83d0e2 +size 199058786 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_83_mp_rank_01_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_83_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..db02c5691ffbd7f9589227db8d9380cfacbe51ae --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_83_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fa45cc89e57df494203896ddedbee5cb58a8a8f6b2afbd07fc53201efa5d6e54 +size 199058786 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6acf3c2a5c1b03a7233e8db88d3ae0ff657db608 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:04fd626721b698d579203a0382385388e2220367dd1f5020e439f4bb8f6c1af1 +size 199058658 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_84_mp_rank_01_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_84_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..39cb698a5c9f74dbdd7ef707a76ca1cfa74c1cbb --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_84_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:faeb2d23a5f4e89de51e189b7c389e6058140aef2edc786505b7b1bfcc4ae625 +size 199058658 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2f490463cfc7bbe30f6c2d3a76f81857078f7947 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d23eb0ac4fd6e49b7810bc28228027987224ffa434e0987435b9146cfae38967 +size 199058786 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_85_mp_rank_01_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_85_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d697c0ebe8c90daa02c2de505a232448a3d7d24a --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_85_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b6a78550a35bc3419882edb12532689d70eeba2d6b9a380d6fe25beabb308c7a +size 199058786 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..34616a5b566063d39c7c3a6d4396bfe0b540f8b6 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3ea939681a93144fc0e9ed1b660aec58c4951bde50882f006375c385e7efe9b3 +size 199058786 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_86_mp_rank_01_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_86_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..137199a40d39de04a3bd5c6579b31badca46c807 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_86_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:620b0ea70d923ca8ca898a7084549b756dda04a0609eabff28a41adde326aeeb +size 199058786 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5be60b12ebd1d56d91aca876da84cfdf3f1337a1 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5925ed008c8d4f198e1594b5864b5d81175825de63b62f6c378508e6c29c0e6e +size 199058722 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_87_mp_rank_01_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_87_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..85a91ba8d2eb4cb857ba547cf1269ea51b03bee4 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_87_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:15bf5e2f15dcae6f66700af38c9e1e9ec3646cd24dcdaadd0999f1988d025b48 +size 199058722 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3608f49d52b6372dbefb480021c39dd0bf7a9cad --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0a3d783a7405fde3f6370b1ecfdbcdb059d23523318448e2df156bdccfdcc52a +size 199058658 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_88_mp_rank_01_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_88_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f28b5633a913ac7add4f862538ce595bb79940b1 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_88_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:475a784e683b8819e11232d2867255d10f756c3ca2292e9505f80c3deb786349 +size 199058658 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4e6b223fb4c08966be1dc6b5a328be825f8c9c83 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:33c3757cd8f9ee849ef472b2456e058317fb456e53798522ff5022b2ab7250b0 +size 199058658 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_89_mp_rank_01_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_89_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..84ec0f8c65b05bdd6615ff2ce3ef2abdb785a2b1 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_89_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df908d6fc6413e56790240ab54bfbd9991a2cf43083b803b3057a6f86ab0d0e2 +size 199058658 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6be7a235041ff88a64b723fdc64f841245e8746c --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ab66a56d4b61617bfa2e0674985974c2d3e16f62599a56b7f7b7ddaa32218bef +size 199058647 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_8_mp_rank_01_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_8_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7b5b56ef5c87168bc20bef0c72b61d28a7d19443 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_8_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:35d7d45644945ec26b660e5f1b883d73490218e4042265001c8980b174262a1d +size 199058647 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9535f68d0e1b53f8b5b134937a10c0185abc37a9 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7d7a86dbce7309cedd7dce487a2b8dde6f51d3f873c7aa4645ace4812a813641 +size 199058850 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_90_mp_rank_01_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_90_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..be7c7060403b3b4232a5706639961b3dd79f0e69 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_90_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:34082d6eeba9bdf636d324d52e8835ac92ab08fbb32be7f4fba3b0da4c626736 +size 199058850 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5df1900f1c785a8ba4e976bf5467a17d69485d25 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:80c230f8bc394d26d754871f7a50c5f19dd896140f2265ebdfd12bab91852cad +size 199058722 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_91_mp_rank_01_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_91_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..607ebd41db2b97a022ab98485f98ca55fdb627b7 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_91_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:577abab12d359df40c99b1477875b53858816710a275b26caf95796eed310237 +size 199058722 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..87617494f48cbbb948fae108601e61be6f6a0366 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fafb9d2ec2e0177a03c76cc65959e75941e9a70ab9c05301c9529a2ab7c6009a +size 199058658 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_92_mp_rank_01_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_92_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5c3c4074646d5ec28c49f55b943406783d500186 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_92_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b5d74924d74a5b6103a7aab088302c6e30342a0667091a199b2e2153256f2653 +size 199058658 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0f7fe8588c05cb758bce25b0cc1c7b6788e869a6 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:38241ad12f78ed911fefbaccfc222854b8eb7ebf004dea19be786c14a81d5fa7 +size 199058786 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_93_mp_rank_01_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_93_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4101ae8464acc51a3b5f9b3bd2ca6a63ba38d373 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_93_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6e189caf6e0dd8150012bec0f48cdf8ee24239f65787bff9f4dd1a46a7f31a1c +size 199058786 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..58c1b954e6a904fd1df50f9aad130cf80e42743a --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9969b7339aa3ea22f891eab0612fce0038661becb36f63a0afb027343755b498 +size 199058722 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_94_mp_rank_01_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_94_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2b7ed1211a8a64097ee9f8ddedfbbd08d01d7957 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_94_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1949d8e08297430ca144fc1013c0a3d981232c2080a07087476763f47a9a2d20 +size 199058722 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..866db55763b1daa6f388f2041608a3bf9fab4c38 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:78dbfcaca4b37699e2f5d9c922d827cba6a551f616f635b4cf0b595b11f75114 +size 199058722 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_95_mp_rank_01_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_95_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..36a7e81193161af4d80c843240df5df333a62d92 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_95_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ecd20c7320dac15cecdaec389e9f02a36326ea8a7e627f34352d3d1b952a6cd +size 199058722 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..10c2f76dd108a96e213e4e75b3c018e1cab675be --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c528f0fea883ea2f22054fcdc206363f7cc6635bc9a5076d0333f3447edfe971 +size 199058722 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_96_mp_rank_01_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_96_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a2da2a156cf25c6eb34fe8c5008d00fbf3f1a619 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_96_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cfa863f5e1c122dc0ad32efc9a23719f3edf6ce4f8c9c6676a1da837e0e41613 +size 199058722 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cad6fc733b1268cacc642463a4770facb43645e6 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:500b29757ebf02003d23a3dfc36c9dc9287513811e118e0ff6d41966df9c70a2 +size 199058786 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_97_mp_rank_01_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_97_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a132e73bb527673a293cb5d6fe5f10709523a0ff --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_97_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a18ce2150fdc13d9347cb75ea86742d15fd47cd07c867897398537fffacf9404 +size 199058786 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a3024e67beff20fe2de0e128f18738b36a9d9310 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4884ad41f36914dc723486ce44cf42badae8bbb703205e2a15831ccfe2cae055 +size 199058658 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_98_mp_rank_01_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_98_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3590020e76e9afe12ecb002a993d65d8fab3b46f --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_98_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9894976fe279fcfd387935e6714cea1f51e9cbd49824d56b55c89fb09ca47e6a +size 199058658 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..af70c74b88bc4036cd6d2d572bb09b95cd663e02 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f679958bc736b8f6de1f0f69516983f7f7ad793de9b9350091d04adca43151c +size 199058658 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_99_mp_rank_01_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_99_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..16e884d4e70bed2615f04b45b5815031cf18c3ca --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_99_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0532066eb420678469a8c42a6b63815691808bcd78ac829548741c169aa60fc4 +size 199058658 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ca8bc33c8607d8a51617f5349346f017f6d4274c --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0ed9b9e9aaef38ca8bd2ffd3660cfebd47424696948574d4242f226df9ef9215 +size 199058839 diff --git a/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_9_mp_rank_01_optim_states.pt b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_9_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..79b63bd455219f73d9322e4032609b2f3a152eb2 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/bf16_zero_pp_rank_9_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1aaaca3b2350ccdd6e8c69a8a155556abf1502aad8f31edf2d700f288e8b14d3 +size 199058839 diff --git a/4b284b1b9c4seed2/global_step80108/layer_01-model_00-model_states.pt b/4b284b1b9c4seed2/global_step80108/layer_01-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..36580f66814ccfce0cab7b674bd6f84930a4af62 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/layer_01-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b6469da04879aa3ad9bbee52db114e7247cddae3fa5628ae4d15e893e3cea212 +size 167511299 diff --git a/4b284b1b9c4seed2/global_step80108/layer_01-model_01-model_states.pt b/4b284b1b9c4seed2/global_step80108/layer_01-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..55cb4e97ce94dcd0b2a330b1fe2df7757fa0e7f1 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/layer_01-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e392e0ea90304efce8977185dcd742e6a1f4178f37236a71a24bfc65e38fa68 +size 167511299 diff --git a/4b284b1b9c4seed2/global_step80108/layer_03-model_00-model_states.pt b/4b284b1b9c4seed2/global_step80108/layer_03-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9c166ab9aaa6cf250c934fa4fba7e333a8c33673 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/layer_03-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:338dd9dab65f0c2b5bb62d809ded55d09f86e25cc6275bcaaef5712325a6651d +size 113308931 diff --git a/4b284b1b9c4seed2/global_step80108/layer_03-model_01-model_states.pt b/4b284b1b9c4seed2/global_step80108/layer_03-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5ec40224374438210fe7d776e9baf823fc258f43 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/layer_03-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7667ce71ba84ada07df2817deccbb510920072bf4df09ba0c916a6d9f4d0382e +size 113308931 diff --git a/4b284b1b9c4seed2/global_step80108/layer_04-model_00-model_states.pt b/4b284b1b9c4seed2/global_step80108/layer_04-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cab536bfd89c4fa73f9d3d3b53eba27d997a3db9 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/layer_04-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:acabe0c15c7672c87b10c9ea0025822549abcfe1190013c1f72f25f2a518ffef +size 113308931 diff --git a/4b284b1b9c4seed2/global_step80108/layer_04-model_01-model_states.pt b/4b284b1b9c4seed2/global_step80108/layer_04-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..434078d9cae22dfb6a480f46e594cfba1d088bf3 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/layer_04-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:448c4eafe8f785efdd1818eced945d560df9a47724f79eca54cab1ec50c3b113 +size 113308931 diff --git a/4b284b1b9c4seed2/global_step80108/layer_05-model_00-model_states.pt b/4b284b1b9c4seed2/global_step80108/layer_05-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..661a7f9955034a8c1ef9fbccd3e5a83b409df75f --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/layer_05-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b6808cb812cbc9e67ccab2865e2e904ba7ed00f659b3c4597e7f7f752dd41b2 +size 113308931 diff --git a/4b284b1b9c4seed2/global_step80108/layer_05-model_01-model_states.pt b/4b284b1b9c4seed2/global_step80108/layer_05-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..958f3dab475e12661d107f90bc94ebcf6d1e0528 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/layer_05-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ef54b44b0aca3e660ac320509f34def592969a566d68d22ae0990077ccdcb6da +size 113308931 diff --git a/4b284b1b9c4seed2/global_step80108/layer_06-model_00-model_states.pt b/4b284b1b9c4seed2/global_step80108/layer_06-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..389e447b3c7be8d665b775fd29fc24d1bd4cf0ac --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/layer_06-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:784fae96dc5eb2ed6d7021a97269248f8e7a6751ed7a12344e166c19e6c51eaa +size 113308931 diff --git a/4b284b1b9c4seed2/global_step80108/layer_06-model_01-model_states.pt b/4b284b1b9c4seed2/global_step80108/layer_06-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..72eaef071855a26255e6f55a257aee3b11b80d91 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/layer_06-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c856c6ac558e523dd06f86be84e2a8a443409325267dd9a882626df3cc0beb16 +size 113308931 diff --git a/4b284b1b9c4seed2/global_step80108/layer_07-model_00-model_states.pt b/4b284b1b9c4seed2/global_step80108/layer_07-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..da62574c4b6bcad3a3601054e11eb21687eb167b --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/layer_07-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:be53fd72057f44c0712a8f1ecec35772807a1d1e681297e724d1d379176f4d87 +size 113308931 diff --git a/4b284b1b9c4seed2/global_step80108/layer_07-model_01-model_states.pt b/4b284b1b9c4seed2/global_step80108/layer_07-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..86aabfd2c6876fc5c801a3eb0aeb95d4b9787a73 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/layer_07-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dd2c0ee0efec4a83624ae9f5c831bf5e1772898fa853821a241383356a71f427 +size 113308931 diff --git a/4b284b1b9c4seed2/global_step80108/layer_08-model_00-model_states.pt b/4b284b1b9c4seed2/global_step80108/layer_08-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3db9dbf39f382b93bbb32999b51a91eea1575c2a --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/layer_08-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:206e64d561d8bb44be1e715055ff5b2b3a0eb461c2a4e5e191707bb041d359b4 +size 113308931 diff --git a/4b284b1b9c4seed2/global_step80108/layer_08-model_01-model_states.pt b/4b284b1b9c4seed2/global_step80108/layer_08-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..23df40e4a576b82a8a433fc4fbc0d24e10cae718 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/layer_08-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cbadc6751b5494d26cea2386e5a5e41652462a27a0402f89eed90da35c0fbd83 +size 113308931 diff --git a/4b284b1b9c4seed2/global_step80108/layer_09-model_00-model_states.pt b/4b284b1b9c4seed2/global_step80108/layer_09-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..67d3959b6b0aae584104d27fcedb8ae4c403cdb6 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/layer_09-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b4cacf40e3927f4d371a19f24a60ca7228a44f7e57b7dd0a122caf3bb34875e2 +size 113308931 diff --git a/4b284b1b9c4seed2/global_step80108/layer_09-model_01-model_states.pt b/4b284b1b9c4seed2/global_step80108/layer_09-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..693c8a34c4bc604be462dd442d0dc158e76b5df4 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/layer_09-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bc45b6353cfd43c3ccdcaa0216f290aa3e91afaa92c70c3e21b8aca2961da8aa +size 113308931 diff --git a/4b284b1b9c4seed2/global_step80108/layer_10-model_00-model_states.pt b/4b284b1b9c4seed2/global_step80108/layer_10-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..527fa206b30f218297e2a4014aff639de3a58e86 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/layer_10-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:059ec2d27c50a5213e59c58057e4ca9f31f4e699bab150541b9b474c2ab9b917 +size 113308931 diff --git a/4b284b1b9c4seed2/global_step80108/layer_10-model_01-model_states.pt b/4b284b1b9c4seed2/global_step80108/layer_10-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d6fbbddc75766df3af876f920109480d698eabff --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/layer_10-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9b6fcfc9d6df487b4bf28b0c030b5d61ecbf7d45ef8b7b00e94656657db58cab +size 113308931 diff --git a/4b284b1b9c4seed2/global_step80108/layer_11-model_00-model_states.pt b/4b284b1b9c4seed2/global_step80108/layer_11-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7f9141a3887df506c258c986d33105fe99785ed0 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/layer_11-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:92a92d8bdb98fa544d68ddd8ca4c24c2f5d0899a56432162af4e3a0f7107e1a6 +size 113308931 diff --git a/4b284b1b9c4seed2/global_step80108/layer_11-model_01-model_states.pt b/4b284b1b9c4seed2/global_step80108/layer_11-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3ed0959a4ca4c8d679be7cd03a5164b01e1220fb --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/layer_11-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4c8f9e0967e3391b586a7a75f3a7b5c126dea3e1182e8e605eab1cafa76035a6 +size 113308931 diff --git a/4b284b1b9c4seed2/global_step80108/layer_12-model_00-model_states.pt b/4b284b1b9c4seed2/global_step80108/layer_12-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0a7b3b9acb71dd29549c778575b07335830fbe32 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/layer_12-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ab684b22af07a72751df77581c2313d88ff8629b7c169cc2a80149c1895a651 +size 113308931 diff --git a/4b284b1b9c4seed2/global_step80108/layer_12-model_01-model_states.pt b/4b284b1b9c4seed2/global_step80108/layer_12-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0ba38cfd354480612f66784793a5fc17c5b26e53 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/layer_12-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:33616893dc8fe8b93a06a498e55bc4ed367ae3d69601b9bd67e5df9827cd35d2 +size 113308931 diff --git a/4b284b1b9c4seed2/global_step80108/layer_13-model_00-model_states.pt b/4b284b1b9c4seed2/global_step80108/layer_13-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cdc8fe440417a91f00099676b3b9e0710a55c1a9 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/layer_13-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3f02f9df59d26fa60e711e2a6a73b106e018e1040146b31fb944d663ae4b0277 +size 113308931 diff --git a/4b284b1b9c4seed2/global_step80108/layer_13-model_01-model_states.pt b/4b284b1b9c4seed2/global_step80108/layer_13-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..99587da9e9409a41a3b559f14e247b280eeaf7fd --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/layer_13-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d431c3b03516101eb358423ee2a3d1c0aba098bf177b6fe19a29cf8f82e4e216 +size 113308931 diff --git a/4b284b1b9c4seed2/global_step80108/layer_14-model_00-model_states.pt b/4b284b1b9c4seed2/global_step80108/layer_14-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..99ddd2658e773f2893771f1b11162074d7f6e646 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/layer_14-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c0d29511f5c664c2c7fdf0fca6db3f53ad51c9e3bf9a6750dc38b1d305a212ed +size 113308931 diff --git a/4b284b1b9c4seed2/global_step80108/layer_14-model_01-model_states.pt b/4b284b1b9c4seed2/global_step80108/layer_14-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..082a5a30b5941c4774e4f70c3182e26781c8970a --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/layer_14-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1e9cd9362f5b9ac0d99399835d96ddeb2eaea62ad65a77d964f056601a1c2196 +size 113308931 diff --git a/4b284b1b9c4seed2/global_step80108/layer_15-model_00-model_states.pt b/4b284b1b9c4seed2/global_step80108/layer_15-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..884c3feab6a01084dfae81021cc7c82e370de256 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/layer_15-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:361ca30459163253f4e95bf5e2216d3c93767597989dde2b2337d36ff68a9f13 +size 113308931 diff --git a/4b284b1b9c4seed2/global_step80108/layer_15-model_01-model_states.pt b/4b284b1b9c4seed2/global_step80108/layer_15-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..64de926f64c0b90358aac0e9da3d6c9cc1ff33e2 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/layer_15-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e296aefb78c8a23f21ff9f9d6356cff563bc810517876c740eedf5712edb0075 +size 113308931 diff --git a/4b284b1b9c4seed2/global_step80108/layer_16-model_00-model_states.pt b/4b284b1b9c4seed2/global_step80108/layer_16-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3e6b83ca6ed14988e7f53af7af0fef5859bc66ac --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/layer_16-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1a9668569403bb9df171450761468337b280c5ba303de40a5e20dd1480bfa99c +size 113308931 diff --git a/4b284b1b9c4seed2/global_step80108/layer_16-model_01-model_states.pt b/4b284b1b9c4seed2/global_step80108/layer_16-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..51a3748a2b546fd32a111e89daa31315c71d04c0 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/layer_16-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c8569e3d486895c120d2cf000b776293b09722b8d4d9da552f0be2601c04ee7a +size 113308931 diff --git a/4b284b1b9c4seed2/global_step80108/layer_17-model_00-model_states.pt b/4b284b1b9c4seed2/global_step80108/layer_17-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..86be265d556d00f00d6f730a664f6dcc330115c6 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/layer_17-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:36bcbce8ae6c545dfc43eb2afd9fd0eb09da41c6ab36a4e95d427593d9814b27 +size 113308931 diff --git a/4b284b1b9c4seed2/global_step80108/layer_17-model_01-model_states.pt b/4b284b1b9c4seed2/global_step80108/layer_17-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8f863b3f0fb4f07ee059a99fe5443a4d70b3da55 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/layer_17-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97ca113fe26e66c75d62ca80726a1e053db14ba62111e0c6e2ef6304484c9f6b +size 113308931 diff --git a/4b284b1b9c4seed2/global_step80108/layer_18-model_00-model_states.pt b/4b284b1b9c4seed2/global_step80108/layer_18-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6cb6afad6245636a863acd0358da701e57b9485d --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/layer_18-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:181310305bdcedd407aaf4ca1f0b67086856e0e029a023658808b332fcc0970c +size 113308931 diff --git a/4b284b1b9c4seed2/global_step80108/layer_18-model_01-model_states.pt b/4b284b1b9c4seed2/global_step80108/layer_18-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f2087b6f5260b911c7d0afd1106ffd38cd8c066d --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/layer_18-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:36fd585e64fd2a433957fb7630f768cb885b00da9f8e0c5c437ab94debb08518 +size 113308931 diff --git a/4b284b1b9c4seed2/global_step80108/layer_19-model_00-model_states.pt b/4b284b1b9c4seed2/global_step80108/layer_19-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..024e850e414e48b9d6abd8a1d1bc41c8d0f529bb --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/layer_19-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:46a07013f652c4c1c33f4c4572e1103b8a2effd471b482a38293aa9301b0e0dc +size 113308931 diff --git a/4b284b1b9c4seed2/global_step80108/layer_19-model_01-model_states.pt b/4b284b1b9c4seed2/global_step80108/layer_19-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..84828ad284856e3463ead2f82cdad0d6e0379aa4 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/layer_19-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a2a456f49fa5a7f853c9386bd2ca4dfd6a1a1bd4882eda08d0b353c2de6f3bd3 +size 113308931 diff --git a/4b284b1b9c4seed2/global_step80108/layer_20-model_00-model_states.pt b/4b284b1b9c4seed2/global_step80108/layer_20-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..72c6702eff8fdd57b924ec8e0110dc8813758a15 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/layer_20-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d494145a1d8d17c1754a2877f2142cb6e306e320c17aac7fbb5a63566be131be +size 113308931 diff --git a/4b284b1b9c4seed2/global_step80108/layer_20-model_01-model_states.pt b/4b284b1b9c4seed2/global_step80108/layer_20-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7721ab88cd3587452b64723407b85dcfa2fc493b --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/layer_20-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7ff9d9a3d0401951ed8261bbd9ee04bf984c1ce68c8e60229d3ce8b02594a7ce +size 113308931 diff --git a/4b284b1b9c4seed2/global_step80108/layer_21-model_00-model_states.pt b/4b284b1b9c4seed2/global_step80108/layer_21-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..44b0c0f81794b837937d7556b08e03f8a8aab65c --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/layer_21-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9d418e7f4d0058fba9fc23717830f7469a4c24cd397eb516100e72190c895258 +size 113308931 diff --git a/4b284b1b9c4seed2/global_step80108/layer_21-model_01-model_states.pt b/4b284b1b9c4seed2/global_step80108/layer_21-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cd1edcd7b0baad0ec0f34a42f0072e789e4debc4 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/layer_21-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:533517daba8bf1dad61c91acb26556050429b9874c83bc19ab16cdad87e87942 +size 113308931 diff --git a/4b284b1b9c4seed2/global_step80108/layer_22-model_00-model_states.pt b/4b284b1b9c4seed2/global_step80108/layer_22-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..89afa7346b1fed87efe0d18083b15f60febdd1c1 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/layer_22-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:92fa65ab01dc6c950999c798b8e449e52b220c521d2ce08a0f0ad0ad6b0b5b8c +size 113308931 diff --git a/4b284b1b9c4seed2/global_step80108/layer_22-model_01-model_states.pt b/4b284b1b9c4seed2/global_step80108/layer_22-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a0a1d7308494f6e41c3e51ad3c355a73ff46f7c8 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/layer_22-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:af54af6318bbbf2c8b6ed0ff3c26bf36627b2a063b9f9e7a8bfdc53e52d6f83c +size 113308931 diff --git a/4b284b1b9c4seed2/global_step80108/layer_23-model_00-model_states.pt b/4b284b1b9c4seed2/global_step80108/layer_23-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..25795e2ee5d2f8479d346ab8ff3daeaabde670c7 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/layer_23-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba17e25af98f838103acdaea342239f6bbec8f1635f697f0a8998e9cc63e2e38 +size 113308931 diff --git a/4b284b1b9c4seed2/global_step80108/layer_23-model_01-model_states.pt b/4b284b1b9c4seed2/global_step80108/layer_23-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f4d70761fda2512dac250606dba59eabb4dff16a --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/layer_23-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:09df1e05456b7eef11c18e2d2676f80cc65291add3ea50a3f3284568457b032e +size 113308931 diff --git a/4b284b1b9c4seed2/global_step80108/layer_24-model_00-model_states.pt b/4b284b1b9c4seed2/global_step80108/layer_24-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7082cf789f9f65b7a21ccb23339b48e53e85963c --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/layer_24-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1400763f1dfa8e5511ce0db2ef6e8fd433cf01db1eac5f3eee844078522fc1df +size 113308931 diff --git a/4b284b1b9c4seed2/global_step80108/layer_24-model_01-model_states.pt b/4b284b1b9c4seed2/global_step80108/layer_24-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c400840fb5512061acb18d0aeea52b04ae44ae25 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/layer_24-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e90479b122ac92c8e1b8455c0bc8c6c803ddee41c8391afcc6d561209a44f92 +size 113308931 diff --git a/4b284b1b9c4seed2/global_step80108/layer_25-model_00-model_states.pt b/4b284b1b9c4seed2/global_step80108/layer_25-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ab03157d693279c3ec8d92b7ecfd434442e51078 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/layer_25-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4ae2c719cd6e357dc03488463318de2d9fdb96dd7cefe2091e2203f4303dc0e2 +size 113308931 diff --git a/4b284b1b9c4seed2/global_step80108/layer_25-model_01-model_states.pt b/4b284b1b9c4seed2/global_step80108/layer_25-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..85b681f96fa34255a98505bda7afbffc4a11e9e8 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/layer_25-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9173eae317fdec82fe347d72fc92f0e38cd9436fd0c3eef66f66f5754d25a4f9 +size 113308931 diff --git a/4b284b1b9c4seed2/global_step80108/layer_26-model_00-model_states.pt b/4b284b1b9c4seed2/global_step80108/layer_26-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..636d2951143546f983f39bf77f93bad8146f9706 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/layer_26-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd6c26565e388b92cb2d66a29cf8f4980d36dce00876b203151309febe326f3b +size 113308931 diff --git a/4b284b1b9c4seed2/global_step80108/layer_26-model_01-model_states.pt b/4b284b1b9c4seed2/global_step80108/layer_26-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..58782f25512623f7bcc71cda729902fdd080635a --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/layer_26-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5212ee33e028d76a5d82cdc5fdc4111ce4c52f34c0773391fdbdfdb2ca1e8b33 +size 113308931 diff --git a/4b284b1b9c4seed2/global_step80108/layer_27-model_00-model_states.pt b/4b284b1b9c4seed2/global_step80108/layer_27-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..88110d5fc747ed292943f0f3b63f961b6ebab1c0 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/layer_27-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:26332f734a438fafaf60d5e5fe0e22223a19582fb63a32bde957a3ef6c218453 +size 113308931 diff --git a/4b284b1b9c4seed2/global_step80108/layer_27-model_01-model_states.pt b/4b284b1b9c4seed2/global_step80108/layer_27-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..54e685e5697868562a8430dac4faafb7d6106796 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/layer_27-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a061fb1ef612929b8186150c89353a3ce5c5b64f42ffe56e8857e8188c012d4b +size 113308931 diff --git a/4b284b1b9c4seed2/global_step80108/layer_28-model_00-model_states.pt b/4b284b1b9c4seed2/global_step80108/layer_28-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0dc80ddb9b609aaf8aabab60678be44604bea98d --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/layer_28-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e470a34a6b152db02556fc0f64ab424616469970ffed80fdee57233249b5eba2 +size 113308931 diff --git a/4b284b1b9c4seed2/global_step80108/layer_28-model_01-model_states.pt b/4b284b1b9c4seed2/global_step80108/layer_28-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e5bda56d4d599221b17568663d2736028f76fe60 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/layer_28-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:18a5225125fdf7b02cde9d99cd518010a4954f0ab93912b9932a5647089d531a +size 113308931 diff --git a/4b284b1b9c4seed2/global_step80108/layer_29-model_00-model_states.pt b/4b284b1b9c4seed2/global_step80108/layer_29-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d71a52519c284e5239637c819a018149d88beef7 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/layer_29-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0242792f161d2bab0dd0d3ffec96fa29dd08429be97ceb8eb61ca4697a852110 +size 113308931 diff --git a/4b284b1b9c4seed2/global_step80108/layer_29-model_01-model_states.pt b/4b284b1b9c4seed2/global_step80108/layer_29-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d4dc7b8dd7931d4c6d4b96cc33d6077d45230cda --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/layer_29-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:086d833a1655bcb30e6bce963a47d5f96b3f421c12214fd3b301608af6d1013d +size 113308931 diff --git a/4b284b1b9c4seed2/global_step80108/layer_30-model_00-model_states.pt b/4b284b1b9c4seed2/global_step80108/layer_30-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d1e781a4cd32720350bece5d366fb10a4bb9aa46 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/layer_30-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:47ae2e6e00b6dcb03f241a44100c65d248f396100a1bb19fdc6d891fdeb3c662 +size 113308931 diff --git a/4b284b1b9c4seed2/global_step80108/layer_30-model_01-model_states.pt b/4b284b1b9c4seed2/global_step80108/layer_30-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..be08757e2142fd84ff53c45374f13b397239845a --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/layer_30-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:baa3bbcc84dc56ce48a845df5415793afebd60f931bf1afe7d643a69304fa49e +size 113308931 diff --git a/4b284b1b9c4seed2/global_step80108/layer_31-model_00-model_states.pt b/4b284b1b9c4seed2/global_step80108/layer_31-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ef6fa1e0abb2d9f6f61f741b8d254fc17a9c4870 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/layer_31-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d1ab44d7653d8db8a5928c21939f85510342517d43b5fc4a7fc9218047c380c2 +size 113308931 diff --git a/4b284b1b9c4seed2/global_step80108/layer_31-model_01-model_states.pt b/4b284b1b9c4seed2/global_step80108/layer_31-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3c06806d44812dd531c12d3193ec21f93b0d4045 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/layer_31-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:098b9f1353ce2e54f946b352960abcb7c87ed5cd996d36f9d5e3bd1eeead0393 +size 113308931 diff --git a/4b284b1b9c4seed2/global_step80108/layer_32-model_00-model_states.pt b/4b284b1b9c4seed2/global_step80108/layer_32-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b5a5277d24496690c16bfabbffbf87f22b5046a5 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/layer_32-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4a21f8a731282b10e2cdac51809a121bbda2d1d16b28e8145ce2e2293be76d4e +size 113308931 diff --git a/4b284b1b9c4seed2/global_step80108/layer_32-model_01-model_states.pt b/4b284b1b9c4seed2/global_step80108/layer_32-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..20ceac182114f159307330c42829e440238c9a87 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/layer_32-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ebfce3560f8defa02cbfde866759ed63729f817eca339efb58899863512ff2c8 +size 113308931 diff --git a/4b284b1b9c4seed2/global_step80108/layer_33-model_00-model_states.pt b/4b284b1b9c4seed2/global_step80108/layer_33-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..26c3a73b9a545ebcc85addfbc82e7e0d8f056532 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/layer_33-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7d97bdae1739483e98392d5583e196b9826d2a387100cd66dd80ad6ba3886dc4 +size 113308931 diff --git a/4b284b1b9c4seed2/global_step80108/layer_33-model_01-model_states.pt b/4b284b1b9c4seed2/global_step80108/layer_33-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..da078c6930617c947790631ae17ca1d835fa451c --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/layer_33-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fb38ba93e55693177544265f59743b84e638a766a363f8b3e790ee050b484e3f +size 113308931 diff --git a/4b284b1b9c4seed2/global_step80108/layer_34-model_00-model_states.pt b/4b284b1b9c4seed2/global_step80108/layer_34-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b1dc3d62247d085589d42b5233c9090ef7679ed4 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/layer_34-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3c1eba94bee6b72950e7582cea15e7e30933b0bebb8a6cf97ac2285723305559 +size 113308931 diff --git a/4b284b1b9c4seed2/global_step80108/layer_34-model_01-model_states.pt b/4b284b1b9c4seed2/global_step80108/layer_34-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a2e05c682f7b99c21bd173ab91d5ac0e1a831ae7 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/layer_34-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4df0fb16be9d5601f1e9ff6aa4a60ac2fee70b4947e3f7fce16a7733cfcbc5d3 +size 113308931 diff --git a/4b284b1b9c4seed2/global_step80108/layer_35-model_00-model_states.pt b/4b284b1b9c4seed2/global_step80108/layer_35-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d1da70107892858981ae5c3c2ea1549f43af4bc2 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/layer_35-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f804bfda7e3dc2058fe380be0faf4cc0dcd855d7733eb49147bc13cbfe9f4a70 +size 113308931 diff --git a/4b284b1b9c4seed2/global_step80108/layer_35-model_01-model_states.pt b/4b284b1b9c4seed2/global_step80108/layer_35-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4ac85881ed6aa67c30208d44ee98c83997ceadde --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/layer_35-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4fb2ce3fb7464fd0685ab8384b506f5596738e92c9f833b8acdc96af879bf88d +size 113308931 diff --git a/4b284b1b9c4seed2/global_step80108/layer_36-model_00-model_states.pt b/4b284b1b9c4seed2/global_step80108/layer_36-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5014656a3036bbb74af590d706634fc2c924c29e --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/layer_36-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:863c4371a44ba034080d4b7f3c7718b7e374cff12a435cdb7cb4f5a78d4db60f +size 113308931 diff --git a/4b284b1b9c4seed2/global_step80108/layer_36-model_01-model_states.pt b/4b284b1b9c4seed2/global_step80108/layer_36-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9766549c8229bcbddf2a4303ac1deaa3778651a4 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/layer_36-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3f081bf87c2553ec0360697cc8fd7035c93035828111b9e39e7aafe81448d478 +size 113308931 diff --git a/4b284b1b9c4seed2/global_step80108/layer_37-model_00-model_states.pt b/4b284b1b9c4seed2/global_step80108/layer_37-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..672890ebaafef49e5e82bafbe1e2775d1f9b1279 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/layer_37-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:59f0411a8689587787f299be06b6989af1f34cf370512abe430750b6fa9f6881 +size 113308931 diff --git a/4b284b1b9c4seed2/global_step80108/layer_37-model_01-model_states.pt b/4b284b1b9c4seed2/global_step80108/layer_37-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2931edac63ffede683540edb6ae780a52add941c --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/layer_37-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:41913bdae4c47913e1b2202b43a1297ff70b3f5a7e64640849018f375888c436 +size 113308931 diff --git a/4b284b1b9c4seed2/global_step80108/layer_38-model_00-model_states.pt b/4b284b1b9c4seed2/global_step80108/layer_38-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5ac6d4193425b7df3927d05d0f2feb0dcec2d59a --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/layer_38-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a9ff8ef35c6d2e4f6f7a988a42dc21f3b233ab6a5fb939a0c79346c730da693f +size 113308931 diff --git a/4b284b1b9c4seed2/global_step80108/layer_38-model_01-model_states.pt b/4b284b1b9c4seed2/global_step80108/layer_38-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0614ea506ae3a6dc4cebafcfe0f710d61c8c54bd --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/layer_38-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:60e82de75d6c6d0a81dc837f9efa268173176dc58b631bfaaf5e9385c76a571f +size 113308931 diff --git a/4b284b1b9c4seed2/global_step80108/layer_40-model_00-model_states.pt b/4b284b1b9c4seed2/global_step80108/layer_40-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..655a012764f473182818bd923545834d594989aa --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/layer_40-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c0efbf7bb3c1418e26a3ac915a2c704fcef2569274f651083b92260cad0bedb +size 13507 diff --git a/4b284b1b9c4seed2/global_step80108/layer_40-model_01-model_states.pt b/4b284b1b9c4seed2/global_step80108/layer_40-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..45048adafdc946367757dcca601c46eebf76a1cd --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/layer_40-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f703d328021d5b63d81aaa81653c2cd1d17baee17efaf21739b99689b7ed4b05 +size 13507 diff --git a/4b284b1b9c4seed2/global_step80108/mp_rank_00_model_states.pt b/4b284b1b9c4seed2/global_step80108/mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..981828318450d7a20400b33bf59d4e3d9e49d31b --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:397c10fe7b52f3cb660ab4df2cbe220b06b25112b145e7901272323c273b92ee +size 51443 diff --git a/4b284b1b9c4seed2/global_step80108/mp_rank_01_model_states.pt b/4b284b1b9c4seed2/global_step80108/mp_rank_01_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0c3c00b814979ee08c0ef3f9f1030699b0197b02 --- /dev/null +++ b/4b284b1b9c4seed2/global_step80108/mp_rank_01_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b5c188b669180039f97a32a3a098fe146785b283c7ea7d940f882f4830b6d2ae +size 51443 diff --git a/4b284b1b9c4seed2/transformers/config.json b/4b284b1b9c4seed2/transformers/config.json new file mode 100644 index 0000000000000000000000000000000000000000..df814c3a71ee49044410636b5eeb4f43611690ba --- /dev/null +++ b/4b284b1b9c4seed2/transformers/config.json @@ -0,0 +1 @@ +{"vocab_size": 50432, "n_positions": 2048, "n_embd": 3072, "n_layer": 36, "n_head": 24, "n_inner": 12288, "activation_function": "gelu", "resid_pdrop": 0.1, "embd_pdrop": 0.1, "attn_pdrop": 0.1, "layer_norm_epsilon": 1e-05, "initializer_range": 0.02, "summary_type": "cls_index", "summary_use_proj": true, "summary_activation": null, "summary_first_dropout": 0.1, "summary_proj_to_labels": true, "scale_attn_weights": true, "use_cache": true, "scale_attn_by_inverse_layer_idx": false, "reorder_and_upcast_attn": false, "bos_token_id": 50256, "eos_token_id": 50256, "return_dict": true, "output_hidden_states": false, "output_attentions": false, "torchscript": false, "torch_dtype": null, "use_bfloat16": false, "tf_legacy_loss": false, "pruned_heads": {}, "tie_word_embeddings": true, "is_encoder_decoder": false, "is_decoder": false, "cross_attention_hidden_size": null, "add_cross_attention": false, "tie_encoder_decoder": false, "max_length": 20, "min_length": 0, "do_sample": false, "early_stopping": false, "num_beams": 1, "num_beam_groups": 1, "diversity_penalty": 0.0, "temperature": 1.0, "top_k": 50, "top_p": 1.0, "typical_p": 1.0, "repetition_penalty": 1.0, "length_penalty": 1.0, "no_repeat_ngram_size": 0, "encoder_no_repeat_ngram_size": 0, "bad_words_ids": null, "num_return_sequences": 1, "chunk_size_feed_forward": 0, "output_scores": false, "return_dict_in_generate": false, "forced_bos_token_id": null, "forced_eos_token_id": null, "remove_invalid_values": false, "exponential_decay_length_penalty": null, "suppress_tokens": null, "begin_suppress_tokens": null, "architectures": ["GPT2LMHeadModel"], "finetuning_task": null, "id2label": {"0": "LABEL_0", "1": "LABEL_1"}, "label2id": {"LABEL_0": 0, "LABEL_1": 1}, "tokenizer_class": null, "prefix": null, "pad_token_id": null, "sep_token_id": null, "decoder_start_token_id": null, "task_specific_params": null, "problem_type": null, "_name_or_path": "", "transformers_version": "4.25.0.dev0", "n_ctx": 1024, "gradient_checkpointing": false, "model_type": "gpt2"} \ No newline at end of file diff --git a/4b284b1b9c4seed2/transformers/pytorch_model.bin b/4b284b1b9c4seed2/transformers/pytorch_model.bin new file mode 100644 index 0000000000000000000000000000000000000000..5241a4b663ebb3d701211677fee3fc45d281182e --- /dev/null +++ b/4b284b1b9c4seed2/transformers/pytorch_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bea2a226e7bd0125cd9f9ecf236a440967ba883caa124627df4e1c7e6b411b7e +size 8781203669 diff --git a/4b284b1b9c4seed3/evaluation/generation/agg.4b284b1b9c4seed3_GEM-web_nlg_en_PALM_prompt_0.json b/4b284b1b9c4seed3/evaluation/generation/agg.4b284b1b9c4seed3_GEM-web_nlg_en_PALM_prompt_0.json new file mode 100644 index 0000000000000000000000000000000000000000..c3fe7b9902c83c687ad4ea2dc0a20a0735e5fe8e --- /dev/null +++ b/4b284b1b9c4seed3/evaluation/generation/agg.4b284b1b9c4seed3_GEM-web_nlg_en_PALM_prompt_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.32012773562587393, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.018886919871708343}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.06825136821356759, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.00237062733299883}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.2508286238498341, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004661697991334146}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.0899762528447479, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0020354843345656163}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.030615387870315716, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0016384196683051863}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.11248984628302856, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0030543468265705285}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.03944916755986983, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.001249719129780461}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.06342619049690505, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.002233393033449764}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.23548259610722824, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004438251763555299}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.08360285576779355, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0018856928971255989}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.06406542591417572, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0022429625274388077}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.234275763130725, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.00433154610375273}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.08427145597780734, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0019051123678010644}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b1b9c4seed3/evaluation/generation/agg.4b284b1b9c4seed3_GEM-web_nlg_en_PALM_prompt_1.json b/4b284b1b9c4seed3/evaluation/generation/agg.4b284b1b9c4seed3_GEM-web_nlg_en_PALM_prompt_1.json new file mode 100644 index 0000000000000000000000000000000000000000..bee713d271f604c6a5e7a1a7e6b860c6f660f287 --- /dev/null +++ b/4b284b1b9c4seed3/evaluation/generation/agg.4b284b1b9c4seed3_GEM-web_nlg_en_PALM_prompt_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.28781282710307465, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.01899808984283447}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.0527754711256334, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0014904713251823198}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.2537614091915221, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004702310798072158}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.07847336913595586, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.001535955643926011}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.021533529321543874, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0007685776439012483}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.10966078271884003, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.002981675456939165}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.032657251493622856, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0009264643374386928}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.04876649614656279, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.001420498632004972}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.23339792109691904, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004315010087105858}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.07228685200884048, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0014209363141639564}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.04935178833491907, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0014212538671699328}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.23635405366452086, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.00434221432817691}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.07320160734011764, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0014251444099725329}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b1b9c4seed3/evaluation/generation/agg.4b284b1b9c4seed3_GEM-web_nlg_en_PALM_prompt_2.json b/4b284b1b9c4seed3/evaluation/generation/agg.4b284b1b9c4seed3_GEM-web_nlg_en_PALM_prompt_2.json new file mode 100644 index 0000000000000000000000000000000000000000..f10ee69ec69b6bee487a6969ee9384244d27d21e --- /dev/null +++ b/4b284b1b9c4seed3/evaluation/generation/agg.4b284b1b9c4seed3_GEM-web_nlg_en_PALM_prompt_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.32085939271138914, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.023874716323242045}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.05368960443919722, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0013878849609328464}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.2687130245556709, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004740106099310347}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.08108986156959869, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0015435730709568757}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.022426372869437324, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0008085489202082841}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.11689977539927107, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.00300061931368436}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.03412133307095403, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0009323084416353588}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.048651633590719855, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0011827185282768337}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.24511580579594355, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004282778444187627}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.07379515479031812, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0013763914362202537}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.05014569138865563, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.001314326894957353}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.24950401790874296, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004286277514587859}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.07555165803520482, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0014213371826134968}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b1b9c4seed3/evaluation/generation/agg.4b284b1b9c4seed3_GEM-web_nlg_en_PALM_prompt_3.json b/4b284b1b9c4seed3/evaluation/generation/agg.4b284b1b9c4seed3_GEM-web_nlg_en_PALM_prompt_3.json new file mode 100644 index 0000000000000000000000000000000000000000..c7abafbf19c17e25f06e6b09e815f9d4686d4b8d --- /dev/null +++ b/4b284b1b9c4seed3/evaluation/generation/agg.4b284b1b9c4seed3_GEM-web_nlg_en_PALM_prompt_3.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.328454678316601, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.022343422759414436}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.052008963484847605, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0014633614953241854}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.26281409902133185, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0047415561831233915}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.07919929805647623, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.001514394418998029}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.02118860914793864, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0008530949812868349}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.11276078198061254, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0030219172592672325}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.032486553286374405, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0008957923404999381}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.0471171164690475, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0013827485067535008}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.23822249787189817, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0042466165786672035}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.07148770019595055, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0013416340928285905}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.04892298323961062, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0014183478958578937}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.24590296884903542, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004380487268920286}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.07424172013111648, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0014133679260911725}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 3, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b1b9c4seed3/evaluation/generation/agg.4b284b1b9c4seed3_GEM-web_nlg_en_PALM_prompt_4.json b/4b284b1b9c4seed3/evaluation/generation/agg.4b284b1b9c4seed3_GEM-web_nlg_en_PALM_prompt_4.json new file mode 100644 index 0000000000000000000000000000000000000000..f9ec7c495de1e6784ba5090b81daaf0447df91e3 --- /dev/null +++ b/4b284b1b9c4seed3/evaluation/generation/agg.4b284b1b9c4seed3_GEM-web_nlg_en_PALM_prompt_4.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.3319702594644372, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.017323146780773062}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.05459708827196318, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0015720228379579838}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.2657448353396512, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004717475684567482}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.08161632894859638, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0015256642009196088}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.023141351440564402, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.001127390810261633}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.11549040824815301, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0030025248991349058}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.03357767413194358, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0009162455741147543}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.04843785490759391, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0014543602029517073}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.23813768049670572, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004172909727083725}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.07227592144254627, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0013148844913734015}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.05090666274679119, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0014735025076296423}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.2482641520424661, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004326751256652749}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.07605405086627043, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0014106467606439447}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 4, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b1b9c4seed3/evaluation/generation/agg.4b284b1b9c4seed3_GEM-web_nlg_en_PALM_prompt_5.json b/4b284b1b9c4seed3/evaluation/generation/agg.4b284b1b9c4seed3_GEM-web_nlg_en_PALM_prompt_5.json new file mode 100644 index 0000000000000000000000000000000000000000..4d80564468e2a4031adc8d7e0ed9945e1f71671b --- /dev/null +++ b/4b284b1b9c4seed3/evaluation/generation/agg.4b284b1b9c4seed3_GEM-web_nlg_en_PALM_prompt_5.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.39182011395821026, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.03017462277769791}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.05338210822991803, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0011795913375033742}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.2739388133076789, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004725041678049671}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.08316112835678297, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0015044194584303333}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.02230990790026212, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0007134756313875014}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.12067184027915072, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.003047769920528369}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.03484163213544278, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0009120223523826239}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.04760001656977872, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.001056801997116071}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.2449561247042928, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004191935654465999}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.07405669758488781, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0013146857723887232}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.049818219801901514, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0011057069363974176}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.25508548910812884, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004349187676537093}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.07747218411731929, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0013880210497301878}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 5, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b1b9c4seed3/evaluation/generation/agg.4b284b1b9c4seed3_GEM-wiki_lingua_en_tldr_en_0.json b/4b284b1b9c4seed3/evaluation/generation/agg.4b284b1b9c4seed3_GEM-wiki_lingua_en_tldr_en_0.json new file mode 100644 index 0000000000000000000000000000000000000000..b9f2734b589f77804209ae195f5d665930bc923a --- /dev/null +++ b/4b284b1b9c4seed3/evaluation/generation/agg.4b284b1b9c4seed3_GEM-wiki_lingua_en_tldr_en_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.14881678764247983, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0018075069170291314}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.24793312894988265, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.002389930611487624}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.1723366320397076, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0016970728587596892}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.025628754354153325, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0006556947869924073}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.04387904423436066, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0012152943972142077}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.02968820163157077, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0007214568491876274}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.11061636395219109, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0012170197578614795}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.19130257812101642, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.001903442450094291}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.12964957358415072, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.001174103551409633}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.13872341402711671, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0016795577613053013}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.23159850567749277, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.002229753265274432}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.1606987702240205, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0015723044572643534}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 1.2190291379439195, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.08836041456372522}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b1b9c4seed3/evaluation/generation/agg.4b284b1b9c4seed3_GEM-wiki_lingua_en_tldr_en_1.json b/4b284b1b9c4seed3/evaluation/generation/agg.4b284b1b9c4seed3_GEM-wiki_lingua_en_tldr_en_1.json new file mode 100644 index 0000000000000000000000000000000000000000..0feaeabea068a3e63604f7a20a02e9439c543533 --- /dev/null +++ b/4b284b1b9c4seed3/evaluation/generation/agg.4b284b1b9c4seed3_GEM-wiki_lingua_en_tldr_en_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.15240917543961252, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.001893453848440131}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.25542377808907146, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0024641171624728577}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.17711899758881897, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0017763415721639936}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.029132226950407722, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.000722011658200494}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.049639629425446356, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0012773856244254617}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.03374713766036158, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0007818322344438194}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.10994692166995118, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0012260681075949413}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.19293230076900478, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0019284923872095526}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.12974115857300988, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0011843934409556005}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.1427583503702487, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0017641069847062667}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.24069300754030848, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0023353688459108405}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.16618151783978977, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0016552458293647842}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 1.5590008346037099, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.06892531048465908}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b1b9c4seed3/evaluation/generation/agg.4b284b1b9c4seed3_GEM-wiki_lingua_en_tldr_en_2.json b/4b284b1b9c4seed3/evaluation/generation/agg.4b284b1b9c4seed3_GEM-wiki_lingua_en_tldr_en_2.json new file mode 100644 index 0000000000000000000000000000000000000000..3733a50f70f24ddde47b3b5863cdfc6ebc86aa3d --- /dev/null +++ b/4b284b1b9c4seed3/evaluation/generation/agg.4b284b1b9c4seed3_GEM-wiki_lingua_en_tldr_en_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.15159610505617108, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0018921710224610877}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.2536664028604043, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0023916817331507876}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.17612683398478715, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0017563955053422117}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.02782910309662972, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0007111400329440863}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.04643317452251163, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0012211811473359306}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.03193124516131047, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.000758958083313296}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.11083516090740873, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0012614447636676077}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.19352563235261244, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0019031906464486539}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.1305484526211359, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0011976224297953603}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.1424531837738363, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0017681228614650911}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.23940558197543957, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0022600581442295}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.1656855868051239, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0016384579347020886}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 1.423539576651847, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.05590338188617223}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b1b9c4seed3/evaluation/generation/agg.4b284b1b9c4seed3_GEM-wiki_lingua_en_tldr_en_3.json b/4b284b1b9c4seed3/evaluation/generation/agg.4b284b1b9c4seed3_GEM-wiki_lingua_en_tldr_en_3.json new file mode 100644 index 0000000000000000000000000000000000000000..dff5805275299549ecd5959b4e89cf8226641d1b --- /dev/null +++ b/4b284b1b9c4seed3/evaluation/generation/agg.4b284b1b9c4seed3_GEM-wiki_lingua_en_tldr_en_3.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.13298493032742092, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0021599143965991448}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.214129162398553, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0028318625372094723}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.14896513024586858, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0020016614890125467}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.0244781955065012, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0007307175719718521}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.03981635760280176, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0012026016154760618}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.02730656796059889, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0007432758390663112}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.09875466672002745, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.001559084136737345}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.1644184900777515, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.00222028334382692}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.11134915972896199, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.00140777630827098}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.12471488513914283, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0020316307804283357}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.20148242502649036, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0026760218524170916}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.1397033192660591, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0018672195336514297}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 1.402481855726376, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.07496831085827607}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 3, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b1b9c4seed3/evaluation/generation/agg.4b284b1b9c4seed3_GEM-wiki_lingua_en_tldr_en_4.json b/4b284b1b9c4seed3/evaluation/generation/agg.4b284b1b9c4seed3_GEM-wiki_lingua_en_tldr_en_4.json new file mode 100644 index 0000000000000000000000000000000000000000..46e7252311fd805536976f85413fb40576659934 --- /dev/null +++ b/4b284b1b9c4seed3/evaluation/generation/agg.4b284b1b9c4seed3_GEM-wiki_lingua_en_tldr_en_4.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.04578189123199333, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0017562670636657443}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.07399147773842517, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.002550315174376835}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.0495274627219381, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.00169718420379995}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.008690556943839151, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0006452419871034267}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.014071929895195552, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0008009026229828391}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.009286374730690028, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.00050108884216674}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.035008115979705615, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0013409826184435712}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.058241103416270305, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0020319511583359808}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.03797030362668432, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0012710366329130882}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.042745554189029616, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0016289097623771287}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.06929822143002932, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.002385334871151041}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.046311955140639516, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0015800586441838697}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 0.3627379747836102, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.03354762768029023}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 4, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b1b9c4seed3/evaluation/generation/agg.4b284b1b9c4seed3_GEM-wiki_lingua_en_tldr_en_5.json b/4b284b1b9c4seed3/evaluation/generation/agg.4b284b1b9c4seed3_GEM-wiki_lingua_en_tldr_en_5.json new file mode 100644 index 0000000000000000000000000000000000000000..e8dad8a72890e0133b6680f13a7b9a623ea244ca --- /dev/null +++ b/4b284b1b9c4seed3/evaluation/generation/agg.4b284b1b9c4seed3_GEM-wiki_lingua_en_tldr_en_5.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.0074834967426424225, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0007736454980237687}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.011934633047410595, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0011163746139347308}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.008032143708786618, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.000769380549886739}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.0011994561802445166, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.00018233396610689006}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.0022243917557991503, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.000328054783161663}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.0014060293109536969, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0002040774536152345}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.005527948528114916, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0005645889276529973}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.009193511694802203, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0008680965592063552}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.005954377693063202, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.000556855926391102}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.007022799151439734, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0007312149938921309}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.011189580936988842, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0010462966465602747}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.0075115815949656104, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0007197306094579381}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 5.170172033055458e-07, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 1.1813622697325427e-06}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 5, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b1b9c4seed3/evaluation/generation/agg.4b284b1b9c4seed3_e2e_nlg_cleaned_generate_text_restaurant_0.json b/4b284b1b9c4seed3/evaluation/generation/agg.4b284b1b9c4seed3_e2e_nlg_cleaned_generate_text_restaurant_0.json new file mode 100644 index 0000000000000000000000000000000000000000..4c765c5a799e85efdbc72ad054214be639240209 --- /dev/null +++ b/4b284b1b9c4seed3/evaluation/generation/agg.4b284b1b9c4seed3_e2e_nlg_cleaned_generate_text_restaurant_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 0.023059028483234455, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.009986858835187516}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.08646635544730007, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.00377831577985332}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.031635634606258116, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.001269300288541845}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.038140802367729314, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.001495094420064931}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.03990955933185571, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0024489170391253133}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.00853219303645261, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.00046389097916627487}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.011993223757428687, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0006456302396314265}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.07881038410549088, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0035148627119781285}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.028615455542499727, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0011483835890292063}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.034369983243126824, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0013496596592950014}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.07924093489385359, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0035579093389609888}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.027741907284705433, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0011204355268068656}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.033892840605688854, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0013502083491247366}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b1b9c4seed3/evaluation/generation/agg.4b284b1b9c4seed3_e2e_nlg_cleaned_generate_text_restaurant_1.json b/4b284b1b9c4seed3/evaluation/generation/agg.4b284b1b9c4seed3_e2e_nlg_cleaned_generate_text_restaurant_1.json new file mode 100644 index 0000000000000000000000000000000000000000..d54c8a5dae4a2f800b875477913a2d1d70b708a0 --- /dev/null +++ b/4b284b1b9c4seed3/evaluation/generation/agg.4b284b1b9c4seed3_e2e_nlg_cleaned_generate_text_restaurant_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 5.92327601668373, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.05843145852320597}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.3069015502240498, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0027141658342019533}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.39979069436919706, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0027344739468908464}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.3195090019700737, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0019316739490464164}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.11881015634283494, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0018726653522764317}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.1547177292472664, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0018688850569839306}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.12124769523896647, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0013611141408615495}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.2310708605355665, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0022062598471417403}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.3039710432903314, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002265711626940462}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.24042839740750466, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0014957834627688047}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.2575158229010334, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.002504168232503219}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.33420271307698657, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.002509091259792972}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.26693221189807087, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0017924495261329944}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b1b9c4seed3/evaluation/generation/agg.4b284b1b9c4seed3_e2e_nlg_cleaned_generate_text_restaurant_2.json b/4b284b1b9c4seed3/evaluation/generation/agg.4b284b1b9c4seed3_e2e_nlg_cleaned_generate_text_restaurant_2.json new file mode 100644 index 0000000000000000000000000000000000000000..cab03d0cf5fe93b670d56a48c92c0d3e4b7ecc10 --- /dev/null +++ b/4b284b1b9c4seed3/evaluation/generation/agg.4b284b1b9c4seed3_e2e_nlg_cleaned_generate_text_restaurant_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 5.798513972951498, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.11353083630417822}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.27602836621141386, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0025780345869436143}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.4181131170949761, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0026506272040465527}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.30806587260671714, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0018509005121755077}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.11242493035118595, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0017273889338398733}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.17096478516816419, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0019293105165237693}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.12337486765629936, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0013085936094396561}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.21692521379325555, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0020430932459005492}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.33431954510893935, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0022474731694641457}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.24343008869727828, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0014161383440201198}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.23257813200591104, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0023360478957229073}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.3524929035089362, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0025454158780705265}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.2593626081415107, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0017672461865662792}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b1b9c4seed3/evaluation/generation/agg.4b284b1b9c4seed3_e2e_nlg_cleaned_generate_text_restaurant_3.json b/4b284b1b9c4seed3/evaluation/generation/agg.4b284b1b9c4seed3_e2e_nlg_cleaned_generate_text_restaurant_3.json new file mode 100644 index 0000000000000000000000000000000000000000..1e75a936c272b14c9ec6f248c56e11679adae0a7 --- /dev/null +++ b/4b284b1b9c4seed3/evaluation/generation/agg.4b284b1b9c4seed3_e2e_nlg_cleaned_generate_text_restaurant_3.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 5.644092780950039, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.10217788685749982}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.26161576269851167, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0025136188998387504}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.41515437679947936, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.002598826549494006}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.2981344592034621, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0018206530175075195}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.10693721487632077, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0017057516502692433}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.16981690105478955, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0019012605105245895}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.11947929128220935, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0012973693582640367}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.2094840503016106, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.002037886584044074}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.3376907481718358, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.00220926835759776}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.23991261995087904, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0014219136572907404}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.22116618474928101, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.00229609611848074}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.35126017567747847, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.002506017472827367}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.25177947103229636, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.001736956932091685}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 3, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b1b9c4seed3/evaluation/generation/agg.4b284b1b9c4seed3_e2e_nlg_cleaned_generate_text_restaurant_4.json b/4b284b1b9c4seed3/evaluation/generation/agg.4b284b1b9c4seed3_e2e_nlg_cleaned_generate_text_restaurant_4.json new file mode 100644 index 0000000000000000000000000000000000000000..709ed6e5eb6b4ef1172fafddda69c850d41f40fb --- /dev/null +++ b/4b284b1b9c4seed3/evaluation/generation/agg.4b284b1b9c4seed3_e2e_nlg_cleaned_generate_text_restaurant_4.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 5.7499537608526206, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.0771735259601375}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.25565023567980505, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0024296319398495005}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.4223930509739377, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0025959915251734665}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.297032269913346, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0018374797196724821}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.10591522249436582, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.001656138422232947}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.17476583770251305, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0019174634136014039}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.12065447384924378, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.001292230076177851}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.2057296852438049, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0019458009062281374}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.3452387295232376, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0022232954316674606}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.2401166198393427, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.001412545210957851}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.2170829438014025, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0022139919637352325}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.359511646806021, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0025629445270113453}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.2520913436920952, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.001756285809527599}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 4, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b1b9c4seed3/evaluation/generation/agg.4b284b1b9c4seed3_e2e_nlg_cleaned_generate_text_restaurant_5.json b/4b284b1b9c4seed3/evaluation/generation/agg.4b284b1b9c4seed3_e2e_nlg_cleaned_generate_text_restaurant_5.json new file mode 100644 index 0000000000000000000000000000000000000000..974436fddef1edd63b27fd0f1477e86a0c907fae --- /dev/null +++ b/4b284b1b9c4seed3/evaluation/generation/agg.4b284b1b9c4seed3_e2e_nlg_cleaned_generate_text_restaurant_5.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 5.770537159308962, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.1190361381685094}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.25787672074394796, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0025328256284091236}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.42573900503618045, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0025754554062627877}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.2987490942442688, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.00182958925425156}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.10790420126833489, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.001769950634717068}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.1764978054536251, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.001953358091932576}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.12169295522428568, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0012994307062877601}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.207955556140787, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.002097923926132232}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.3476137840160232, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002207282217829847}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.24138350753763696, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0014118485855993332}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.21954740035518447, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0023503093866769544}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.3624191463006945, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0025392023747063696}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.2537764861825883, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0017644696653914508}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 5, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b1b9c4seed3/evaluation/generation/agg.4b284b1b9c4seed3_gem_xsum_article_DOC_summary_0.json b/4b284b1b9c4seed3/evaluation/generation/agg.4b284b1b9c4seed3_gem_xsum_article_DOC_summary_0.json new file mode 100644 index 0000000000000000000000000000000000000000..6be7b63d4f6a1eaa91dcfb6e7003af0835afe9c0 --- /dev/null +++ b/4b284b1b9c4seed3/evaluation/generation/agg.4b284b1b9c4seed3_gem_xsum_article_DOC_summary_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.14542424202725895, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0022138246399507205}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.31877105379992854, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0039014668311384846}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.1924128186381312, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002360900852656541}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.026751288404993658, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0010068959458770191}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.06119647795475897, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0021992283140675147}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.035715714855404174, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0012470772810957468}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.10850993070385385, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0016022951483510026}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.2403257780307599, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0030478006648468224}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.14397207180406998, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0017392037354323953}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.1137602974676654, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0016663613584011713}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.25349408376272603, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0033388300752575585}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.1513854308550901, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0018706736809661465}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 1.2602613828624476, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.08741245069026914}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b1b9c4seed3/evaluation/generation/agg.4b284b1b9c4seed3_gem_xsum_article_DOC_summary_1.json b/4b284b1b9c4seed3/evaluation/generation/agg.4b284b1b9c4seed3_gem_xsum_article_DOC_summary_1.json new file mode 100644 index 0000000000000000000000000000000000000000..785122c15b2deb8f5cc19978c2398beb5f014ff0 --- /dev/null +++ b/4b284b1b9c4seed3/evaluation/generation/agg.4b284b1b9c4seed3_gem_xsum_article_DOC_summary_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.10549993650520251, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.00153501677078187}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.2612212727377519, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0034404286739595498}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.14848707861095392, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0020468594975290248}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.013994761205987642, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0007149071339383721}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.0356140526531422, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0017994780886659853}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.01983861975775417, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0009966264701985932}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.08181009058637802, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0011239080238855375}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.20392678730897415, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002600805826506937}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.11531599073392822, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0015026013618598068}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.08559803726047839, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.001213987918870468}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.21400310748327384, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0028528494274868274}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.12077280177911864, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0016322822837075467}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 0.7915703643644384, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.08396451150549139}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b1b9c4seed3/evaluation/generation/agg.4b284b1b9c4seed3_gem_xsum_article_DOC_summary_2.json b/4b284b1b9c4seed3/evaluation/generation/agg.4b284b1b9c4seed3_gem_xsum_article_DOC_summary_2.json new file mode 100644 index 0000000000000000000000000000000000000000..8e8fe741ac37bce5ed2fe0037f8aedf42b092e8a --- /dev/null +++ b/4b284b1b9c4seed3/evaluation/generation/agg.4b284b1b9c4seed3_gem_xsum_article_DOC_summary_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.10471570168180548, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0014494215119621229}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.2620545799252738, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.003320038801060601}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.14783482736166878, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.001930898165701915}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.01319945934793176, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0006302627050860287}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.03471557162965618, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0016776406415917023}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.018873329322073275, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0008955667212919246}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.08197306181617371, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0010777654445218213}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.2071426347373322, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0026041548046999877}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.11600786897853718, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0014481058046010048}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.08489744619220965, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0011830647260639108}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.21467503234909532, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.002893408444556316}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.12019939004505038, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0016060029611780855}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 0.6502670718184665, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.05324899628422249}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b1b9c4seed3/evaluation/generation/agg.4b284b1b9c4seed3_gem_xsum_article_DOC_summary_3.json b/4b284b1b9c4seed3/evaluation/generation/agg.4b284b1b9c4seed3_gem_xsum_article_DOC_summary_3.json new file mode 100644 index 0000000000000000000000000000000000000000..f350bdb57860335c21b1e2ada16d37b481db8764 --- /dev/null +++ b/4b284b1b9c4seed3/evaluation/generation/agg.4b284b1b9c4seed3_gem_xsum_article_DOC_summary_3.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.10410860827262407, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0016985601546784064}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.24975935094410306, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0036359468821554417}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.1434515966047625, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0021396059501441697}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.0133838272101195, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0006651947823416613}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.032957650415980116, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0016410836459370027}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.01863408799342264, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0009121268268702102}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.07992461082726765, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0012408675788602088}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.1932235805685923, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.00277498209308085}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.11028077942863275, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0015625007588984398}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.0839932835001092, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0013382454039087637}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.20290901214848292, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0029990659468279056}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.11596810997110246, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.001710823422300248}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 0.72650775578876, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.07009722650167388}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 3, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b1b9c4seed3/evaluation/generation/agg.4b284b1b9c4seed3_gem_xsum_article_DOC_summary_4.json b/4b284b1b9c4seed3/evaluation/generation/agg.4b284b1b9c4seed3_gem_xsum_article_DOC_summary_4.json new file mode 100644 index 0000000000000000000000000000000000000000..78a5ee87dad05a470457607c70a07eedf7b00382 --- /dev/null +++ b/4b284b1b9c4seed3/evaluation/generation/agg.4b284b1b9c4seed3_gem_xsum_article_DOC_summary_4.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.03133602840154907, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.001987959380677703}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.06067401952247452, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.003487892178028924}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.037884638019230664, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.00214775480739452}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.0034573763117096636, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.00044354666596204615}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.007156768365840787, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0008508883614159644}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.0043759041403374135, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0005183680894634575}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.024472567308614246, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0015926598243951066}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.04698578958663985, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002673075415704531}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.029266330660064416, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0016348070626843912}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.0257721881730792, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0016575889068278311}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.04994885638600292, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0028614395409444103}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.031041105487741426, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0017460208416643014}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 0.27256554319567566, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.05393365990560443}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 4, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b1b9c4seed3/evaluation/generation/agg.4b284b1b9c4seed3_gem_xsum_article_DOC_summary_5.json b/4b284b1b9c4seed3/evaluation/generation/agg.4b284b1b9c4seed3_gem_xsum_article_DOC_summary_5.json new file mode 100644 index 0000000000000000000000000000000000000000..2b15b4226128ac234b2ab93b4a837385ee5932f2 --- /dev/null +++ b/4b284b1b9c4seed3/evaluation/generation/agg.4b284b1b9c4seed3_gem_xsum_article_DOC_summary_5.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.002422654460959852, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.000701445835208553}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.002150434002930073, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0006364013868075673}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.0022183238269151938, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0006462435715584798}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.00047185826875061065, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.00025359131866297053}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.00042238421955403087, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.00024978354101036374}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.00044144904818645863, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.00024927107535141214}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.0020288572682842206, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.000585169484066717}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.0018274673120388537, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0005474767964183582}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.0018677137784396751, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0005453913617070764}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.00207399584371078, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0005893776256546286}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.001865187279004104, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0005528638398211417}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.0019066970935807948, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0005494437621613826}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 2.5634857131422677e-38, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 1.7875744611015253e-32}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 5, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b1b9c4seed3/evaluation/generation/examples.4b284b1b9c4seed3_GEM-web_nlg_en_PALM_prompt_0.jsonl b/4b284b1b9c4seed3/evaluation/generation/examples.4b284b1b9c4seed3_GEM-web_nlg_en_PALM_prompt_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..dcf5eb8b0b1e522b059631d88202e71c59970d56 --- /dev/null +++ b/4b284b1b9c4seed3/evaluation/generation/examples.4b284b1b9c4seed3_GEM-web_nlg_en_PALM_prompt_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5c352316408ce68ca3303cc75864eb1a71a8adc5b65bd730efedf3e7c21a64f5 +size 4027240 diff --git a/4b284b1b9c4seed3/evaluation/generation/examples.4b284b1b9c4seed3_GEM-web_nlg_en_PALM_prompt_1.jsonl b/4b284b1b9c4seed3/evaluation/generation/examples.4b284b1b9c4seed3_GEM-web_nlg_en_PALM_prompt_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..3b8571baf1f126e1ded887a2bee684ecfad45d36 --- /dev/null +++ b/4b284b1b9c4seed3/evaluation/generation/examples.4b284b1b9c4seed3_GEM-web_nlg_en_PALM_prompt_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:30d5e53497d214cf68522c1c23677f55bbe4ba294131e4f799e3faa8dadd468b +size 5056021 diff --git a/4b284b1b9c4seed3/evaluation/generation/examples.4b284b1b9c4seed3_GEM-web_nlg_en_PALM_prompt_2.jsonl b/4b284b1b9c4seed3/evaluation/generation/examples.4b284b1b9c4seed3_GEM-web_nlg_en_PALM_prompt_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..5a7b610f9cc6237b9540de1086639f6ac4d78043 --- /dev/null +++ b/4b284b1b9c4seed3/evaluation/generation/examples.4b284b1b9c4seed3_GEM-web_nlg_en_PALM_prompt_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:690df19d20cafe834a91eeea44aff69cbc5747626d537187966f41befdd4fa03 +size 5973149 diff --git a/4b284b1b9c4seed3/evaluation/generation/examples.4b284b1b9c4seed3_GEM-web_nlg_en_PALM_prompt_3.jsonl b/4b284b1b9c4seed3/evaluation/generation/examples.4b284b1b9c4seed3_GEM-web_nlg_en_PALM_prompt_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..874478396cbb9d0359484f3f1e9e19e9e99d51ba --- /dev/null +++ b/4b284b1b9c4seed3/evaluation/generation/examples.4b284b1b9c4seed3_GEM-web_nlg_en_PALM_prompt_3.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:182017889d46664d6a286042d2616a17c48c686e2be29accda4fbd57c3c5fb59 +size 6881955 diff --git a/4b284b1b9c4seed3/evaluation/generation/examples.4b284b1b9c4seed3_GEM-web_nlg_en_PALM_prompt_4.jsonl b/4b284b1b9c4seed3/evaluation/generation/examples.4b284b1b9c4seed3_GEM-web_nlg_en_PALM_prompt_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..ea786eca2d6367a27a0c16cd9a83e0f210f8013d --- /dev/null +++ b/4b284b1b9c4seed3/evaluation/generation/examples.4b284b1b9c4seed3_GEM-web_nlg_en_PALM_prompt_4.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7e63d02946c105937f18a1943684e3e0b517ca36835f38a74515b0934b853f57 +size 7789915 diff --git a/4b284b1b9c4seed3/evaluation/generation/examples.4b284b1b9c4seed3_GEM-web_nlg_en_PALM_prompt_5.jsonl b/4b284b1b9c4seed3/evaluation/generation/examples.4b284b1b9c4seed3_GEM-web_nlg_en_PALM_prompt_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..b214df2413f869f8e4f90ade3aa8f3a5c3a88b57 --- /dev/null +++ b/4b284b1b9c4seed3/evaluation/generation/examples.4b284b1b9c4seed3_GEM-web_nlg_en_PALM_prompt_5.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5ffde5a853fd1a067cc45305c7dccdc60599321ef31191b0be5c9ab065076b2b +size 8705149 diff --git a/4b284b1b9c4seed3/evaluation/generation/examples.4b284b1b9c4seed3_GEM-wiki_lingua_en_tldr_en_0.jsonl b/4b284b1b9c4seed3/evaluation/generation/examples.4b284b1b9c4seed3_GEM-wiki_lingua_en_tldr_en_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..16a1b4353a73dce1265faa9cb6cc974bd50da8d0 --- /dev/null +++ b/4b284b1b9c4seed3/evaluation/generation/examples.4b284b1b9c4seed3_GEM-wiki_lingua_en_tldr_en_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d418dda59cd5f4885b592bd4b3b17609ea50783e3b81cc8319f8d08418ef9338 +size 7714723 diff --git a/4b284b1b9c4seed3/evaluation/generation/examples.4b284b1b9c4seed3_GEM-wiki_lingua_en_tldr_en_1.jsonl b/4b284b1b9c4seed3/evaluation/generation/examples.4b284b1b9c4seed3_GEM-wiki_lingua_en_tldr_en_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..ca3292fdc13118022ceacab443ab5face5351468 --- /dev/null +++ b/4b284b1b9c4seed3/evaluation/generation/examples.4b284b1b9c4seed3_GEM-wiki_lingua_en_tldr_en_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f9ad8ae0ce6bb197234320a81115198d6cebe131142ed0d902d760d397dc2e58 +size 13326504 diff --git a/4b284b1b9c4seed3/evaluation/generation/examples.4b284b1b9c4seed3_GEM-wiki_lingua_en_tldr_en_2.jsonl b/4b284b1b9c4seed3/evaluation/generation/examples.4b284b1b9c4seed3_GEM-wiki_lingua_en_tldr_en_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..04baadbdb7e9ba6fafa2052cf8b91d54cc64e485 --- /dev/null +++ b/4b284b1b9c4seed3/evaluation/generation/examples.4b284b1b9c4seed3_GEM-wiki_lingua_en_tldr_en_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d41a6286907a53d50d153fa89736046152e276802d92f7aab637ce7b55ce3aeb +size 18925897 diff --git a/4b284b1b9c4seed3/evaluation/generation/examples.4b284b1b9c4seed3_GEM-wiki_lingua_en_tldr_en_3.jsonl b/4b284b1b9c4seed3/evaluation/generation/examples.4b284b1b9c4seed3_GEM-wiki_lingua_en_tldr_en_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..65c9c721aac8ec76fee673136507fe54e30ee21c --- /dev/null +++ b/4b284b1b9c4seed3/evaluation/generation/examples.4b284b1b9c4seed3_GEM-wiki_lingua_en_tldr_en_3.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1a129842df973d0690485825116a575b3d3a585f89e899d01d61923f4ca7239a +size 24346025 diff --git a/4b284b1b9c4seed3/evaluation/generation/examples.4b284b1b9c4seed3_GEM-wiki_lingua_en_tldr_en_4.jsonl b/4b284b1b9c4seed3/evaluation/generation/examples.4b284b1b9c4seed3_GEM-wiki_lingua_en_tldr_en_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..c783545a18a18686889825c2a7f11c2e6e0fefe1 --- /dev/null +++ b/4b284b1b9c4seed3/evaluation/generation/examples.4b284b1b9c4seed3_GEM-wiki_lingua_en_tldr_en_4.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c57e1ac08e1f4f4f4763fd5263123ec31c494c0729adcd478144e0f6ef981ab4 +size 29479949 diff --git a/4b284b1b9c4seed3/evaluation/generation/examples.4b284b1b9c4seed3_GEM-wiki_lingua_en_tldr_en_5.jsonl b/4b284b1b9c4seed3/evaluation/generation/examples.4b284b1b9c4seed3_GEM-wiki_lingua_en_tldr_en_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..d49c899b3dce4f448c7155f3706071e3b079e86e --- /dev/null +++ b/4b284b1b9c4seed3/evaluation/generation/examples.4b284b1b9c4seed3_GEM-wiki_lingua_en_tldr_en_5.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0447509df75a2ec82797c1e3e6de503e455c76c8136dd57658dcbe0cbaf8b7ed +size 34801193 diff --git a/4b284b1b9c4seed3/evaluation/generation/examples.4b284b1b9c4seed3_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl b/4b284b1b9c4seed3/evaluation/generation/examples.4b284b1b9c4seed3_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..7987fe0b62baa482ec683ee13c4a0e7f7ddaf145 --- /dev/null +++ b/4b284b1b9c4seed3/evaluation/generation/examples.4b284b1b9c4seed3_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c9c4258b92d5795a6e30413b411a29de6ed9a25aad2ccfbf57e7e89ed1a3b90e +size 3701530 diff --git a/4b284b1b9c4seed3/evaluation/generation/examples.4b284b1b9c4seed3_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl b/4b284b1b9c4seed3/evaluation/generation/examples.4b284b1b9c4seed3_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..a11f9cf5799fc43aced871bdac8e0fac34f5d261 --- /dev/null +++ b/4b284b1b9c4seed3/evaluation/generation/examples.4b284b1b9c4seed3_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d3d0f991a97d672c586a4c86565275426f27c61c40b99c429575f65e243072a6 +size 5303447 diff --git a/4b284b1b9c4seed3/evaluation/generation/examples.4b284b1b9c4seed3_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl b/4b284b1b9c4seed3/evaluation/generation/examples.4b284b1b9c4seed3_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..3bf59518001a4c3693eb61475e8d295a867a49c6 --- /dev/null +++ b/4b284b1b9c4seed3/evaluation/generation/examples.4b284b1b9c4seed3_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b93077bffa904b8845a13ba597a0c3518f31196cddd57a460a11dafb350036f1 +size 6475569 diff --git a/4b284b1b9c4seed3/evaluation/generation/examples.4b284b1b9c4seed3_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl b/4b284b1b9c4seed3/evaluation/generation/examples.4b284b1b9c4seed3_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..378371e56a65bf5feaa75ce3d4208d472e0ee5a7 --- /dev/null +++ b/4b284b1b9c4seed3/evaluation/generation/examples.4b284b1b9c4seed3_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:05c82e92f05b9302e329df36a77d0e8e1ffddc0425248f28e1e4662700f0c16c +size 7586436 diff --git a/4b284b1b9c4seed3/evaluation/generation/examples.4b284b1b9c4seed3_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl b/4b284b1b9c4seed3/evaluation/generation/examples.4b284b1b9c4seed3_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..1cfbf06cc3e3100da9c8fae5145f230e157a32b1 --- /dev/null +++ b/4b284b1b9c4seed3/evaluation/generation/examples.4b284b1b9c4seed3_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:93480e2d56059cc962d38bd99c611577cf4c3326ecb545005713de78bd1dc702 +size 8685338 diff --git a/4b284b1b9c4seed3/evaluation/generation/examples.4b284b1b9c4seed3_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl b/4b284b1b9c4seed3/evaluation/generation/examples.4b284b1b9c4seed3_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..7407a773d19c2c3cd95d597513255412cf54fb5d --- /dev/null +++ b/4b284b1b9c4seed3/evaluation/generation/examples.4b284b1b9c4seed3_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a4517757579d471b4e53d2e76450724e19b335b08ab71cb31868f8d45b24ed7 +size 9773162 diff --git a/4b284b1b9c4seed3/evaluation/generation/examples.4b284b1b9c4seed3_gem_xsum_article_DOC_summary_0.jsonl b/4b284b1b9c4seed3/evaluation/generation/examples.4b284b1b9c4seed3_gem_xsum_article_DOC_summary_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..b356fb7b9f9815145fce935c6d54593c01bcaa7b --- /dev/null +++ b/4b284b1b9c4seed3/evaluation/generation/examples.4b284b1b9c4seed3_gem_xsum_article_DOC_summary_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:67fc6ad95f5720eca3df198b5f21c704a2e8f10597dfae134cafa9c9b74252f9 +size 2817910 diff --git a/4b284b1b9c4seed3/evaluation/generation/examples.4b284b1b9c4seed3_gem_xsum_article_DOC_summary_1.jsonl b/4b284b1b9c4seed3/evaluation/generation/examples.4b284b1b9c4seed3_gem_xsum_article_DOC_summary_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..1d1c4c4a7ac4fdc02dccfbb27c44089fb6dc0b6c --- /dev/null +++ b/4b284b1b9c4seed3/evaluation/generation/examples.4b284b1b9c4seed3_gem_xsum_article_DOC_summary_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b53c82907280d9676cff9b6dd41f9f115f79f8eb3990b3dbdaa330e83e76db99 +size 5104735 diff --git a/4b284b1b9c4seed3/evaluation/generation/examples.4b284b1b9c4seed3_gem_xsum_article_DOC_summary_2.jsonl b/4b284b1b9c4seed3/evaluation/generation/examples.4b284b1b9c4seed3_gem_xsum_article_DOC_summary_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..0365142ceaf0c2ebc5f6338b935bbb8ac7b039a6 --- /dev/null +++ b/4b284b1b9c4seed3/evaluation/generation/examples.4b284b1b9c4seed3_gem_xsum_article_DOC_summary_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:128c1522bbf4a1741f1104e83e2333984061d20f1272967cc0f7ddb4f1c31dd5 +size 7380793 diff --git a/4b284b1b9c4seed3/evaluation/generation/examples.4b284b1b9c4seed3_gem_xsum_article_DOC_summary_3.jsonl b/4b284b1b9c4seed3/evaluation/generation/examples.4b284b1b9c4seed3_gem_xsum_article_DOC_summary_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..16bf70143c07f446c6d03a357e6f205d5233b8d5 --- /dev/null +++ b/4b284b1b9c4seed3/evaluation/generation/examples.4b284b1b9c4seed3_gem_xsum_article_DOC_summary_3.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:283be13932b3fe7400116e63e75836d18e1a0c829aaef06719bb296f3b5576fb +size 9650924 diff --git a/4b284b1b9c4seed3/evaluation/generation/examples.4b284b1b9c4seed3_gem_xsum_article_DOC_summary_4.jsonl b/4b284b1b9c4seed3/evaluation/generation/examples.4b284b1b9c4seed3_gem_xsum_article_DOC_summary_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..2f35c6cffc6194128e8eac43dfc4737b7caf537e --- /dev/null +++ b/4b284b1b9c4seed3/evaluation/generation/examples.4b284b1b9c4seed3_gem_xsum_article_DOC_summary_4.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9dff810a074027c6277a2254ab29b4f7d53506f435d64ba5132bd952f27fb798 +size 11673976 diff --git a/4b284b1b9c4seed3/evaluation/generation/examples.4b284b1b9c4seed3_gem_xsum_article_DOC_summary_5.jsonl b/4b284b1b9c4seed3/evaluation/generation/examples.4b284b1b9c4seed3_gem_xsum_article_DOC_summary_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..5fe980d60d407f008fa68b0271c1c24cca13bf72 --- /dev/null +++ b/4b284b1b9c4seed3/evaluation/generation/examples.4b284b1b9c4seed3_gem_xsum_article_DOC_summary_5.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4070db72983d7269d7242b3297e54079a0ced7a6ec77a828f6c939d9ff7ac73a +size 13897524 diff --git a/4b284b1b9c4seed3/evaluation/generation/merged.csv b/4b284b1b9c4seed3/evaluation/generation/merged.csv new file mode 100644 index 0000000000000000000000000000000000000000..e1254d7868ec0ae33c4fafc2cc707487a9aa169d --- /dev/null +++ b/4b284b1b9c4seed3/evaluation/generation/merged.csv @@ -0,0 +1,53 @@ +dataset,fewshots,prompt,metric,value +e2e_nlg_cleaned,0,generate_text_restaurant,rouge2_fmeasure,0.011993223757428687 +e2e_nlg_cleaned,0,median,rouge2_fmeasure,0.011993223757428687 +e2e_nlg_cleaned,1,generate_text_restaurant,rouge2_fmeasure,0.12124769523896647 +e2e_nlg_cleaned,1,median,rouge2_fmeasure,0.12124769523896647 +e2e_nlg_cleaned,2,generate_text_restaurant,rouge2_fmeasure,0.12337486765629936 +e2e_nlg_cleaned,2,median,rouge2_fmeasure,0.12337486765629936 +e2e_nlg_cleaned,3,generate_text_restaurant,rouge2_fmeasure,0.11947929128220935 +e2e_nlg_cleaned,3,median,rouge2_fmeasure,0.11947929128220935 +e2e_nlg_cleaned,4,generate_text_restaurant,rouge2_fmeasure,0.12065447384924378 +e2e_nlg_cleaned,4,median,rouge2_fmeasure,0.12065447384924378 +e2e_nlg_cleaned,5,generate_text_restaurant,rouge2_fmeasure,0.12169295522428568 +e2e_nlg_cleaned,5,median,rouge2_fmeasure,0.12169295522428568 +e2e_nlg_cleaned,5,average,multiple,0.10307375116807223 +gem_xsum,0,article_DOC_summary,rouge2_fmeasure,0.035715714855404174 +gem_xsum,0,median,rouge2_fmeasure,0.035715714855404174 +gem_xsum,1,article_DOC_summary,rouge2_fmeasure,0.01983861975775417 +gem_xsum,1,median,rouge2_fmeasure,0.01983861975775417 +gem_xsum,2,article_DOC_summary,rouge2_fmeasure,0.018873329322073275 +gem_xsum,2,median,rouge2_fmeasure,0.018873329322073275 +gem_xsum,3,article_DOC_summary,rouge2_fmeasure,0.01863408799342264 +gem_xsum,3,median,rouge2_fmeasure,0.01863408799342264 +gem_xsum,4,article_DOC_summary,rouge2_fmeasure,0.0043759041403374135 +gem_xsum,4,median,rouge2_fmeasure,0.0043759041403374135 +gem_xsum,5,article_DOC_summary,rouge2_fmeasure,0.00044144904818645863 +gem_xsum,5,median,rouge2_fmeasure,0.00044144904818645863 +gem_xsum,5,average,multiple,0.016313184186196355 +web_nlg_en,0,PALM_prompt,rouge2_fmeasure,0.03944916755986983 +web_nlg_en,0,median,rouge2_fmeasure,0.03944916755986983 +web_nlg_en,1,PALM_prompt,rouge2_fmeasure,0.032657251493622856 +web_nlg_en,1,median,rouge2_fmeasure,0.032657251493622856 +web_nlg_en,2,PALM_prompt,rouge2_fmeasure,0.03412133307095403 +web_nlg_en,2,median,rouge2_fmeasure,0.03412133307095403 +web_nlg_en,3,PALM_prompt,rouge2_fmeasure,0.032486553286374405 +web_nlg_en,3,median,rouge2_fmeasure,0.032486553286374405 +web_nlg_en,4,PALM_prompt,rouge2_fmeasure,0.03357767413194358 +web_nlg_en,4,median,rouge2_fmeasure,0.03357767413194358 +web_nlg_en,5,PALM_prompt,rouge2_fmeasure,0.03484163213544278 +web_nlg_en,5,median,rouge2_fmeasure,0.03484163213544278 +web_nlg_en,5,average,multiple,0.03452226861303458 +wiki_lingua_en,0,tldr_en,rouge2_fmeasure,0.02968820163157077 +wiki_lingua_en,0,median,rouge2_fmeasure,0.02968820163157077 +wiki_lingua_en,1,tldr_en,rouge2_fmeasure,0.03374713766036158 +wiki_lingua_en,1,median,rouge2_fmeasure,0.03374713766036158 +wiki_lingua_en,2,tldr_en,rouge2_fmeasure,0.03193124516131047 +wiki_lingua_en,2,median,rouge2_fmeasure,0.03193124516131047 +wiki_lingua_en,3,tldr_en,rouge2_fmeasure,0.02730656796059889 +wiki_lingua_en,3,median,rouge2_fmeasure,0.02730656796059889 +wiki_lingua_en,4,tldr_en,rouge2_fmeasure,0.009286374730690028 +wiki_lingua_en,4,median,rouge2_fmeasure,0.009286374730690028 +wiki_lingua_en,5,tldr_en,rouge2_fmeasure,0.0014060293109536969 +wiki_lingua_en,5,median,rouge2_fmeasure,0.0014060293109536969 +wiki_lingua_en,5,average,multiple,0.022227592742580904 diff --git a/4b284b1b9c4seed3/evaluation/generation/merged.json b/4b284b1b9c4seed3/evaluation/generation/merged.json new file mode 100644 index 0000000000000000000000000000000000000000..cd4d4947940cb554983502661747cdb8ad83331b --- /dev/null +++ b/4b284b1b9c4seed3/evaluation/generation/merged.json @@ -0,0 +1 @@ +{"GEM/web_nlg_en": {"0": {"PALM_prompt": {"bleu": 0.32012773562587393, "bleu_stderr": 0.018886919871708343, "rouge1_fmeasure": 0.0899762528447479, "rouge1_fmeasure_stderr": 0.0020354843345656163, "rouge1_precision": 0.06825136821356759, "rouge1_precision_stderr": 0.00237062733299883, "rouge1_recall": 0.2508286238498341, "rouge1_recall_stderr": 0.004661697991334146, "rouge2_fmeasure": 0.03944916755986983, "rouge2_fmeasure_stderr": 0.001249719129780461, "rouge2_precision": 0.030615387870315716, "rouge2_precision_stderr": 0.0016384196683051863, "rouge2_recall": 0.11248984628302856, "rouge2_recall_stderr": 0.0030543468265705285, "rougeL_fmeasure": 0.08360285576779355, "rougeL_fmeasure_stderr": 0.0018856928971255989, "rougeL_precision": 0.06342619049690505, "rougeL_precision_stderr": 0.002233393033449764, "rougeL_recall": 0.23548259610722824, "rougeL_recall_stderr": 0.004438251763555299, "rougeLsum_fmeasure": 0.08427145597780734, "rougeLsum_fmeasure_stderr": 0.0019051123678010644, "rougeLsum_precision": 0.06406542591417572, "rougeLsum_precision_stderr": 0.0022429625274388077, "rougeLsum_recall": 0.234275763130725, "rougeLsum_recall_stderr": 0.00433154610375273}}, "1": {"PALM_prompt": {"bleu": 0.28781282710307465, "bleu_stderr": 0.01899808984283447, "rouge1_fmeasure": 0.07847336913595586, "rouge1_fmeasure_stderr": 0.001535955643926011, "rouge1_precision": 0.0527754711256334, "rouge1_precision_stderr": 0.0014904713251823198, "rouge1_recall": 0.2537614091915221, "rouge1_recall_stderr": 0.004702310798072158, "rouge2_fmeasure": 0.032657251493622856, "rouge2_fmeasure_stderr": 0.0009264643374386928, "rouge2_precision": 0.021533529321543874, "rouge2_precision_stderr": 0.0007685776439012483, "rouge2_recall": 0.10966078271884003, "rouge2_recall_stderr": 0.002981675456939165, "rougeL_fmeasure": 0.07228685200884048, "rougeL_fmeasure_stderr": 0.0014209363141639564, "rougeL_precision": 0.04876649614656279, "rougeL_precision_stderr": 0.001420498632004972, "rougeL_recall": 0.23339792109691904, "rougeL_recall_stderr": 0.004315010087105858, "rougeLsum_fmeasure": 0.07320160734011764, "rougeLsum_fmeasure_stderr": 0.0014251444099725329, "rougeLsum_precision": 0.04935178833491907, "rougeLsum_precision_stderr": 0.0014212538671699328, "rougeLsum_recall": 0.23635405366452086, "rougeLsum_recall_stderr": 0.00434221432817691}}, "2": {"PALM_prompt": {"bleu": 0.32085939271138914, "bleu_stderr": 0.023874716323242045, "rouge1_fmeasure": 0.08108986156959869, "rouge1_fmeasure_stderr": 0.0015435730709568757, "rouge1_precision": 0.05368960443919722, "rouge1_precision_stderr": 0.0013878849609328464, "rouge1_recall": 0.2687130245556709, "rouge1_recall_stderr": 0.004740106099310347, "rouge2_fmeasure": 0.03412133307095403, "rouge2_fmeasure_stderr": 0.0009323084416353588, "rouge2_precision": 0.022426372869437324, "rouge2_precision_stderr": 0.0008085489202082841, "rouge2_recall": 0.11689977539927107, "rouge2_recall_stderr": 0.00300061931368436, "rougeL_fmeasure": 0.07379515479031812, "rougeL_fmeasure_stderr": 0.0013763914362202537, "rougeL_precision": 0.048651633590719855, "rougeL_precision_stderr": 0.0011827185282768337, "rougeL_recall": 0.24511580579594355, "rougeL_recall_stderr": 0.004282778444187627, "rougeLsum_fmeasure": 0.07555165803520482, "rougeLsum_fmeasure_stderr": 0.0014213371826134968, "rougeLsum_precision": 0.05014569138865563, "rougeLsum_precision_stderr": 0.001314326894957353, "rougeLsum_recall": 0.24950401790874296, "rougeLsum_recall_stderr": 0.004286277514587859}}, "3": {"PALM_prompt": {"bleu": 0.328454678316601, "bleu_stderr": 0.022343422759414436, "rouge1_fmeasure": 0.07919929805647623, "rouge1_fmeasure_stderr": 0.001514394418998029, "rouge1_precision": 0.052008963484847605, "rouge1_precision_stderr": 0.0014633614953241854, "rouge1_recall": 0.26281409902133185, "rouge1_recall_stderr": 0.0047415561831233915, "rouge2_fmeasure": 0.032486553286374405, "rouge2_fmeasure_stderr": 0.0008957923404999381, "rouge2_precision": 0.02118860914793864, "rouge2_precision_stderr": 0.0008530949812868349, "rouge2_recall": 0.11276078198061254, "rouge2_recall_stderr": 0.0030219172592672325, "rougeL_fmeasure": 0.07148770019595055, "rougeL_fmeasure_stderr": 0.0013416340928285905, "rougeL_precision": 0.0471171164690475, "rougeL_precision_stderr": 0.0013827485067535008, "rougeL_recall": 0.23822249787189817, "rougeL_recall_stderr": 0.0042466165786672035, "rougeLsum_fmeasure": 0.07424172013111648, "rougeLsum_fmeasure_stderr": 0.0014133679260911725, "rougeLsum_precision": 0.04892298323961062, "rougeLsum_precision_stderr": 0.0014183478958578937, "rougeLsum_recall": 0.24590296884903542, "rougeLsum_recall_stderr": 0.004380487268920286}}, "4": {"PALM_prompt": {"bleu": 0.3319702594644372, "bleu_stderr": 0.017323146780773062, "rouge1_fmeasure": 0.08161632894859638, "rouge1_fmeasure_stderr": 0.0015256642009196088, "rouge1_precision": 0.05459708827196318, "rouge1_precision_stderr": 0.0015720228379579838, "rouge1_recall": 0.2657448353396512, "rouge1_recall_stderr": 0.004717475684567482, "rouge2_fmeasure": 0.03357767413194358, "rouge2_fmeasure_stderr": 0.0009162455741147543, "rouge2_precision": 0.023141351440564402, "rouge2_precision_stderr": 0.001127390810261633, "rouge2_recall": 0.11549040824815301, "rouge2_recall_stderr": 0.0030025248991349058, "rougeL_fmeasure": 0.07227592144254627, "rougeL_fmeasure_stderr": 0.0013148844913734015, "rougeL_precision": 0.04843785490759391, "rougeL_precision_stderr": 0.0014543602029517073, "rougeL_recall": 0.23813768049670572, "rougeL_recall_stderr": 0.004172909727083725, "rougeLsum_fmeasure": 0.07605405086627043, "rougeLsum_fmeasure_stderr": 0.0014106467606439447, "rougeLsum_precision": 0.05090666274679119, "rougeLsum_precision_stderr": 0.0014735025076296423, "rougeLsum_recall": 0.2482641520424661, "rougeLsum_recall_stderr": 0.004326751256652749}}, "5": {"PALM_prompt": {"bleu": 0.39182011395821026, "bleu_stderr": 0.03017462277769791, "rouge1_fmeasure": 0.08316112835678297, "rouge1_fmeasure_stderr": 0.0015044194584303333, "rouge1_precision": 0.05338210822991803, "rouge1_precision_stderr": 0.0011795913375033742, "rouge1_recall": 0.2739388133076789, "rouge1_recall_stderr": 0.004725041678049671, "rouge2_fmeasure": 0.03484163213544278, "rouge2_fmeasure_stderr": 0.0009120223523826239, "rouge2_precision": 0.02230990790026212, "rouge2_precision_stderr": 0.0007134756313875014, "rouge2_recall": 0.12067184027915072, "rouge2_recall_stderr": 0.003047769920528369, "rougeL_fmeasure": 0.07405669758488781, "rougeL_fmeasure_stderr": 0.0013146857723887232, "rougeL_precision": 0.04760001656977872, "rougeL_precision_stderr": 0.001056801997116071, "rougeL_recall": 0.2449561247042928, "rougeL_recall_stderr": 0.004191935654465999, "rougeLsum_fmeasure": 0.07747218411731929, "rougeLsum_fmeasure_stderr": 0.0013880210497301878, "rougeLsum_precision": 0.049818219801901514, "rougeLsum_precision_stderr": 0.0011057069363974176, "rougeLsum_recall": 0.25508548910812884, "rougeLsum_recall_stderr": 0.004349187676537093}}}, "GEM/wiki_lingua_en": {"0": {"tldr_en": {"bleu": 1.2190291379439195, "bleu_stderr": 0.08836041456372522, "rouge1_fmeasure": 0.1723366320397076, "rouge1_fmeasure_stderr": 0.0016970728587596892, "rouge1_precision": 0.14881678764247983, "rouge1_precision_stderr": 0.0018075069170291314, "rouge1_recall": 0.24793312894988265, "rouge1_recall_stderr": 0.002389930611487624, "rouge2_fmeasure": 0.02968820163157077, "rouge2_fmeasure_stderr": 0.0007214568491876274, "rouge2_precision": 0.025628754354153325, "rouge2_precision_stderr": 0.0006556947869924073, "rouge2_recall": 0.04387904423436066, "rouge2_recall_stderr": 0.0012152943972142077, "rougeL_fmeasure": 0.12964957358415072, "rougeL_fmeasure_stderr": 0.001174103551409633, "rougeL_precision": 0.11061636395219109, "rougeL_precision_stderr": 0.0012170197578614795, "rougeL_recall": 0.19130257812101642, "rougeL_recall_stderr": 0.001903442450094291, "rougeLsum_fmeasure": 0.1606987702240205, "rougeLsum_fmeasure_stderr": 0.0015723044572643534, "rougeLsum_precision": 0.13872341402711671, "rougeLsum_precision_stderr": 0.0016795577613053013, "rougeLsum_recall": 0.23159850567749277, "rougeLsum_recall_stderr": 0.002229753265274432}}, "1": {"tldr_en": {"bleu": 1.5590008346037099, "bleu_stderr": 0.06892531048465908, "rouge1_fmeasure": 0.17711899758881897, "rouge1_fmeasure_stderr": 0.0017763415721639936, "rouge1_precision": 0.15240917543961252, "rouge1_precision_stderr": 0.001893453848440131, "rouge1_recall": 0.25542377808907146, "rouge1_recall_stderr": 0.0024641171624728577, "rouge2_fmeasure": 0.03374713766036158, "rouge2_fmeasure_stderr": 0.0007818322344438194, "rouge2_precision": 0.029132226950407722, "rouge2_precision_stderr": 0.000722011658200494, "rouge2_recall": 0.049639629425446356, "rouge2_recall_stderr": 0.0012773856244254617, "rougeL_fmeasure": 0.12974115857300988, "rougeL_fmeasure_stderr": 0.0011843934409556005, "rougeL_precision": 0.10994692166995118, "rougeL_precision_stderr": 0.0012260681075949413, "rougeL_recall": 0.19293230076900478, "rougeL_recall_stderr": 0.0019284923872095526, "rougeLsum_fmeasure": 0.16618151783978977, "rougeLsum_fmeasure_stderr": 0.0016552458293647842, "rougeLsum_precision": 0.1427583503702487, "rougeLsum_precision_stderr": 0.0017641069847062667, "rougeLsum_recall": 0.24069300754030848, "rougeLsum_recall_stderr": 0.0023353688459108405}}, "2": {"tldr_en": {"bleu": 1.423539576651847, "bleu_stderr": 0.05590338188617223, "rouge1_fmeasure": 0.17612683398478715, "rouge1_fmeasure_stderr": 0.0017563955053422117, "rouge1_precision": 0.15159610505617108, "rouge1_precision_stderr": 0.0018921710224610877, "rouge1_recall": 0.2536664028604043, "rouge1_recall_stderr": 0.0023916817331507876, "rouge2_fmeasure": 0.03193124516131047, "rouge2_fmeasure_stderr": 0.000758958083313296, "rouge2_precision": 0.02782910309662972, "rouge2_precision_stderr": 0.0007111400329440863, "rouge2_recall": 0.04643317452251163, "rouge2_recall_stderr": 0.0012211811473359306, "rougeL_fmeasure": 0.1305484526211359, "rougeL_fmeasure_stderr": 0.0011976224297953603, "rougeL_precision": 0.11083516090740873, "rougeL_precision_stderr": 0.0012614447636676077, "rougeL_recall": 0.19352563235261244, "rougeL_recall_stderr": 0.0019031906464486539, "rougeLsum_fmeasure": 0.1656855868051239, "rougeLsum_fmeasure_stderr": 0.0016384579347020886, "rougeLsum_precision": 0.1424531837738363, "rougeLsum_precision_stderr": 0.0017681228614650911, "rougeLsum_recall": 0.23940558197543957, "rougeLsum_recall_stderr": 0.0022600581442295}}, "3": {"tldr_en": {"bleu": 1.402481855726376, "bleu_stderr": 0.07496831085827607, "rouge1_fmeasure": 0.14896513024586858, "rouge1_fmeasure_stderr": 0.0020016614890125467, "rouge1_precision": 0.13298493032742092, "rouge1_precision_stderr": 0.0021599143965991448, "rouge1_recall": 0.214129162398553, "rouge1_recall_stderr": 0.0028318625372094723, "rouge2_fmeasure": 0.02730656796059889, "rouge2_fmeasure_stderr": 0.0007432758390663112, "rouge2_precision": 0.0244781955065012, "rouge2_precision_stderr": 0.0007307175719718521, "rouge2_recall": 0.03981635760280176, "rouge2_recall_stderr": 0.0012026016154760618, "rougeL_fmeasure": 0.11134915972896199, "rougeL_fmeasure_stderr": 0.00140777630827098, "rougeL_precision": 0.09875466672002745, "rougeL_precision_stderr": 0.001559084136737345, "rougeL_recall": 0.1644184900777515, "rougeL_recall_stderr": 0.00222028334382692, "rougeLsum_fmeasure": 0.1397033192660591, "rougeLsum_fmeasure_stderr": 0.0018672195336514297, "rougeLsum_precision": 0.12471488513914283, "rougeLsum_precision_stderr": 0.0020316307804283357, "rougeLsum_recall": 0.20148242502649036, "rougeLsum_recall_stderr": 0.0026760218524170916}}, "4": {"tldr_en": {"bleu": 0.3627379747836102, "bleu_stderr": 0.03354762768029023, "rouge1_fmeasure": 0.0495274627219381, "rouge1_fmeasure_stderr": 0.00169718420379995, "rouge1_precision": 0.04578189123199333, "rouge1_precision_stderr": 0.0017562670636657443, "rouge1_recall": 0.07399147773842517, "rouge1_recall_stderr": 0.002550315174376835, "rouge2_fmeasure": 0.009286374730690028, "rouge2_fmeasure_stderr": 0.00050108884216674, "rouge2_precision": 0.008690556943839151, "rouge2_precision_stderr": 0.0006452419871034267, "rouge2_recall": 0.014071929895195552, "rouge2_recall_stderr": 0.0008009026229828391, "rougeL_fmeasure": 0.03797030362668432, "rougeL_fmeasure_stderr": 0.0012710366329130882, "rougeL_precision": 0.035008115979705615, "rougeL_precision_stderr": 0.0013409826184435712, "rougeL_recall": 0.058241103416270305, "rougeL_recall_stderr": 0.0020319511583359808, "rougeLsum_fmeasure": 0.046311955140639516, "rougeLsum_fmeasure_stderr": 0.0015800586441838697, "rougeLsum_precision": 0.042745554189029616, "rougeLsum_precision_stderr": 0.0016289097623771287, "rougeLsum_recall": 0.06929822143002932, "rougeLsum_recall_stderr": 0.002385334871151041}}, "5": {"tldr_en": {"bleu": 5.170172033055458e-07, "bleu_stderr": 1.1813622697325427e-06, "rouge1_fmeasure": 0.008032143708786618, "rouge1_fmeasure_stderr": 0.000769380549886739, "rouge1_precision": 0.0074834967426424225, "rouge1_precision_stderr": 0.0007736454980237687, "rouge1_recall": 0.011934633047410595, "rouge1_recall_stderr": 0.0011163746139347308, "rouge2_fmeasure": 0.0014060293109536969, "rouge2_fmeasure_stderr": 0.0002040774536152345, "rouge2_precision": 0.0011994561802445166, "rouge2_precision_stderr": 0.00018233396610689006, "rouge2_recall": 0.0022243917557991503, "rouge2_recall_stderr": 0.000328054783161663, "rougeL_fmeasure": 0.005954377693063202, "rougeL_fmeasure_stderr": 0.000556855926391102, "rougeL_precision": 0.005527948528114916, "rougeL_precision_stderr": 0.0005645889276529973, "rougeL_recall": 0.009193511694802203, "rougeL_recall_stderr": 0.0008680965592063552, "rougeLsum_fmeasure": 0.0075115815949656104, "rougeLsum_fmeasure_stderr": 0.0007197306094579381, "rougeLsum_precision": 0.007022799151439734, "rougeLsum_precision_stderr": 0.0007312149938921309, "rougeLsum_recall": 0.011189580936988842, "rougeLsum_recall_stderr": 0.0010462966465602747}}}, "e2e_nlg_cleaned": {"0": {"generate_text_restaurant": {"bleu": 0.023059028483234455, "bleu_stderr": 0.009986858835187516, "rouge1_fmeasure": 0.038140802367729314, "rouge1_fmeasure_stderr": 0.001495094420064931, "rouge1_precision": 0.08646635544730007, "rouge1_precision_stderr": 0.00377831577985332, "rouge1_recall": 0.031635634606258116, "rouge1_recall_stderr": 0.001269300288541845, "rouge2_fmeasure": 0.011993223757428687, "rouge2_fmeasure_stderr": 0.0006456302396314265, "rouge2_precision": 0.03990955933185571, "rouge2_precision_stderr": 0.0024489170391253133, "rouge2_recall": 0.00853219303645261, "rouge2_recall_stderr": 0.00046389097916627487, "rougeL_fmeasure": 0.034369983243126824, "rougeL_fmeasure_stderr": 0.0013496596592950014, "rougeL_precision": 0.07881038410549088, "rougeL_precision_stderr": 0.0035148627119781285, "rougeL_recall": 0.028615455542499727, "rougeL_recall_stderr": 0.0011483835890292063, "rougeLsum_fmeasure": 0.033892840605688854, "rougeLsum_fmeasure_stderr": 0.0013502083491247366, "rougeLsum_precision": 0.07924093489385359, "rougeLsum_precision_stderr": 0.0035579093389609888, "rougeLsum_recall": 0.027741907284705433, "rougeLsum_recall_stderr": 0.0011204355268068656}}, "1": {"generate_text_restaurant": {"bleu": 5.92327601668373, "bleu_stderr": 0.05843145852320597, "rouge1_fmeasure": 0.3195090019700737, "rouge1_fmeasure_stderr": 0.0019316739490464164, "rouge1_precision": 0.3069015502240498, "rouge1_precision_stderr": 0.0027141658342019533, "rouge1_recall": 0.39979069436919706, "rouge1_recall_stderr": 0.0027344739468908464, "rouge2_fmeasure": 0.12124769523896647, "rouge2_fmeasure_stderr": 0.0013611141408615495, "rouge2_precision": 0.11881015634283494, "rouge2_precision_stderr": 0.0018726653522764317, "rouge2_recall": 0.1547177292472664, "rouge2_recall_stderr": 0.0018688850569839306, "rougeL_fmeasure": 0.24042839740750466, "rougeL_fmeasure_stderr": 0.0014957834627688047, "rougeL_precision": 0.2310708605355665, "rougeL_precision_stderr": 0.0022062598471417403, "rougeL_recall": 0.3039710432903314, "rougeL_recall_stderr": 0.002265711626940462, "rougeLsum_fmeasure": 0.26693221189807087, "rougeLsum_fmeasure_stderr": 0.0017924495261329944, "rougeLsum_precision": 0.2575158229010334, "rougeLsum_precision_stderr": 0.002504168232503219, "rougeLsum_recall": 0.33420271307698657, "rougeLsum_recall_stderr": 0.002509091259792972}}, "2": {"generate_text_restaurant": {"bleu": 5.798513972951498, "bleu_stderr": 0.11353083630417822, "rouge1_fmeasure": 0.30806587260671714, "rouge1_fmeasure_stderr": 0.0018509005121755077, "rouge1_precision": 0.27602836621141386, "rouge1_precision_stderr": 0.0025780345869436143, "rouge1_recall": 0.4181131170949761, "rouge1_recall_stderr": 0.0026506272040465527, "rouge2_fmeasure": 0.12337486765629936, "rouge2_fmeasure_stderr": 0.0013085936094396561, "rouge2_precision": 0.11242493035118595, "rouge2_precision_stderr": 0.0017273889338398733, "rouge2_recall": 0.17096478516816419, "rouge2_recall_stderr": 0.0019293105165237693, "rougeL_fmeasure": 0.24343008869727828, "rougeL_fmeasure_stderr": 0.0014161383440201198, "rougeL_precision": 0.21692521379325555, "rougeL_precision_stderr": 0.0020430932459005492, "rougeL_recall": 0.33431954510893935, "rougeL_recall_stderr": 0.0022474731694641457, "rougeLsum_fmeasure": 0.2593626081415107, "rougeLsum_fmeasure_stderr": 0.0017672461865662792, "rougeLsum_precision": 0.23257813200591104, "rougeLsum_precision_stderr": 0.0023360478957229073, "rougeLsum_recall": 0.3524929035089362, "rougeLsum_recall_stderr": 0.0025454158780705265}}, "3": {"generate_text_restaurant": {"bleu": 5.644092780950039, "bleu_stderr": 0.10217788685749982, "rouge1_fmeasure": 0.2981344592034621, "rouge1_fmeasure_stderr": 0.0018206530175075195, "rouge1_precision": 0.26161576269851167, "rouge1_precision_stderr": 0.0025136188998387504, "rouge1_recall": 0.41515437679947936, "rouge1_recall_stderr": 0.002598826549494006, "rouge2_fmeasure": 0.11947929128220935, "rouge2_fmeasure_stderr": 0.0012973693582640367, "rouge2_precision": 0.10693721487632077, "rouge2_precision_stderr": 0.0017057516502692433, "rouge2_recall": 0.16981690105478955, "rouge2_recall_stderr": 0.0019012605105245895, "rougeL_fmeasure": 0.23991261995087904, "rougeL_fmeasure_stderr": 0.0014219136572907404, "rougeL_precision": 0.2094840503016106, "rougeL_precision_stderr": 0.002037886584044074, "rougeL_recall": 0.3376907481718358, "rougeL_recall_stderr": 0.00220926835759776, "rougeLsum_fmeasure": 0.25177947103229636, "rougeLsum_fmeasure_stderr": 0.001736956932091685, "rougeLsum_precision": 0.22116618474928101, "rougeLsum_precision_stderr": 0.00229609611848074, "rougeLsum_recall": 0.35126017567747847, "rougeLsum_recall_stderr": 0.002506017472827367}}, "4": {"generate_text_restaurant": {"bleu": 5.7499537608526206, "bleu_stderr": 0.0771735259601375, "rouge1_fmeasure": 0.297032269913346, "rouge1_fmeasure_stderr": 0.0018374797196724821, "rouge1_precision": 0.25565023567980505, "rouge1_precision_stderr": 0.0024296319398495005, "rouge1_recall": 0.4223930509739377, "rouge1_recall_stderr": 0.0025959915251734665, "rouge2_fmeasure": 0.12065447384924378, "rouge2_fmeasure_stderr": 0.001292230076177851, "rouge2_precision": 0.10591522249436582, "rouge2_precision_stderr": 0.001656138422232947, "rouge2_recall": 0.17476583770251305, "rouge2_recall_stderr": 0.0019174634136014039, "rougeL_fmeasure": 0.2401166198393427, "rougeL_fmeasure_stderr": 0.001412545210957851, "rougeL_precision": 0.2057296852438049, "rougeL_precision_stderr": 0.0019458009062281374, "rougeL_recall": 0.3452387295232376, "rougeL_recall_stderr": 0.0022232954316674606, "rougeLsum_fmeasure": 0.2520913436920952, "rougeLsum_fmeasure_stderr": 0.001756285809527599, "rougeLsum_precision": 0.2170829438014025, "rougeLsum_precision_stderr": 0.0022139919637352325, "rougeLsum_recall": 0.359511646806021, "rougeLsum_recall_stderr": 0.0025629445270113453}}, "5": {"generate_text_restaurant": {"bleu": 5.770537159308962, "bleu_stderr": 0.1190361381685094, "rouge1_fmeasure": 0.2987490942442688, "rouge1_fmeasure_stderr": 0.00182958925425156, "rouge1_precision": 0.25787672074394796, "rouge1_precision_stderr": 0.0025328256284091236, "rouge1_recall": 0.42573900503618045, "rouge1_recall_stderr": 0.0025754554062627877, "rouge2_fmeasure": 0.12169295522428568, "rouge2_fmeasure_stderr": 0.0012994307062877601, "rouge2_precision": 0.10790420126833489, "rouge2_precision_stderr": 0.001769950634717068, "rouge2_recall": 0.1764978054536251, "rouge2_recall_stderr": 0.001953358091932576, "rougeL_fmeasure": 0.24138350753763696, "rougeL_fmeasure_stderr": 0.0014118485855993332, "rougeL_precision": 0.207955556140787, "rougeL_precision_stderr": 0.002097923926132232, "rougeL_recall": 0.3476137840160232, "rougeL_recall_stderr": 0.002207282217829847, "rougeLsum_fmeasure": 0.2537764861825883, "rougeLsum_fmeasure_stderr": 0.0017644696653914508, "rougeLsum_precision": 0.21954740035518447, "rougeLsum_precision_stderr": 0.0023503093866769544, "rougeLsum_recall": 0.3624191463006945, "rougeLsum_recall_stderr": 0.0025392023747063696}}}, "gem_xsum": {"0": {"article_DOC_summary": {"bleu": 1.2602613828624476, "bleu_stderr": 0.08741245069026914, "rouge1_fmeasure": 0.1924128186381312, "rouge1_fmeasure_stderr": 0.002360900852656541, "rouge1_precision": 0.14542424202725895, "rouge1_precision_stderr": 0.0022138246399507205, "rouge1_recall": 0.31877105379992854, "rouge1_recall_stderr": 0.0039014668311384846, "rouge2_fmeasure": 0.035715714855404174, "rouge2_fmeasure_stderr": 0.0012470772810957468, "rouge2_precision": 0.026751288404993658, "rouge2_precision_stderr": 0.0010068959458770191, "rouge2_recall": 0.06119647795475897, "rouge2_recall_stderr": 0.0021992283140675147, "rougeL_fmeasure": 0.14397207180406998, "rougeL_fmeasure_stderr": 0.0017392037354323953, "rougeL_precision": 0.10850993070385385, "rougeL_precision_stderr": 0.0016022951483510026, "rougeL_recall": 0.2403257780307599, "rougeL_recall_stderr": 0.0030478006648468224, "rougeLsum_fmeasure": 0.1513854308550901, "rougeLsum_fmeasure_stderr": 0.0018706736809661465, "rougeLsum_precision": 0.1137602974676654, "rougeLsum_precision_stderr": 0.0016663613584011713, "rougeLsum_recall": 0.25349408376272603, "rougeLsum_recall_stderr": 0.0033388300752575585}}, "1": {"article_DOC_summary": {"bleu": 0.7915703643644384, "bleu_stderr": 0.08396451150549139, "rouge1_fmeasure": 0.14848707861095392, "rouge1_fmeasure_stderr": 0.0020468594975290248, "rouge1_precision": 0.10549993650520251, "rouge1_precision_stderr": 0.00153501677078187, "rouge1_recall": 0.2612212727377519, "rouge1_recall_stderr": 0.0034404286739595498, "rouge2_fmeasure": 0.01983861975775417, "rouge2_fmeasure_stderr": 0.0009966264701985932, "rouge2_precision": 0.013994761205987642, "rouge2_precision_stderr": 0.0007149071339383721, "rouge2_recall": 0.0356140526531422, "rouge2_recall_stderr": 0.0017994780886659853, "rougeL_fmeasure": 0.11531599073392822, "rougeL_fmeasure_stderr": 0.0015026013618598068, "rougeL_precision": 0.08181009058637802, "rougeL_precision_stderr": 0.0011239080238855375, "rougeL_recall": 0.20392678730897415, "rougeL_recall_stderr": 0.002600805826506937, "rougeLsum_fmeasure": 0.12077280177911864, "rougeLsum_fmeasure_stderr": 0.0016322822837075467, "rougeLsum_precision": 0.08559803726047839, "rougeLsum_precision_stderr": 0.001213987918870468, "rougeLsum_recall": 0.21400310748327384, "rougeLsum_recall_stderr": 0.0028528494274868274}}, "2": {"article_DOC_summary": {"bleu": 0.6502670718184665, "bleu_stderr": 0.05324899628422249, "rouge1_fmeasure": 0.14783482736166878, "rouge1_fmeasure_stderr": 0.001930898165701915, "rouge1_precision": 0.10471570168180548, "rouge1_precision_stderr": 0.0014494215119621229, "rouge1_recall": 0.2620545799252738, "rouge1_recall_stderr": 0.003320038801060601, "rouge2_fmeasure": 0.018873329322073275, "rouge2_fmeasure_stderr": 0.0008955667212919246, "rouge2_precision": 0.01319945934793176, "rouge2_precision_stderr": 0.0006302627050860287, "rouge2_recall": 0.03471557162965618, "rouge2_recall_stderr": 0.0016776406415917023, "rougeL_fmeasure": 0.11600786897853718, "rougeL_fmeasure_stderr": 0.0014481058046010048, "rougeL_precision": 0.08197306181617371, "rougeL_precision_stderr": 0.0010777654445218213, "rougeL_recall": 0.2071426347373322, "rougeL_recall_stderr": 0.0026041548046999877, "rougeLsum_fmeasure": 0.12019939004505038, "rougeLsum_fmeasure_stderr": 0.0016060029611780855, "rougeLsum_precision": 0.08489744619220965, "rougeLsum_precision_stderr": 0.0011830647260639108, "rougeLsum_recall": 0.21467503234909532, "rougeLsum_recall_stderr": 0.002893408444556316}}, "3": {"article_DOC_summary": {"bleu": 0.72650775578876, "bleu_stderr": 0.07009722650167388, "rouge1_fmeasure": 0.1434515966047625, "rouge1_fmeasure_stderr": 0.0021396059501441697, "rouge1_precision": 0.10410860827262407, "rouge1_precision_stderr": 0.0016985601546784064, "rouge1_recall": 0.24975935094410306, "rouge1_recall_stderr": 0.0036359468821554417, "rouge2_fmeasure": 0.01863408799342264, "rouge2_fmeasure_stderr": 0.0009121268268702102, "rouge2_precision": 0.0133838272101195, "rouge2_precision_stderr": 0.0006651947823416613, "rouge2_recall": 0.032957650415980116, "rouge2_recall_stderr": 0.0016410836459370027, "rougeL_fmeasure": 0.11028077942863275, "rougeL_fmeasure_stderr": 0.0015625007588984398, "rougeL_precision": 0.07992461082726765, "rougeL_precision_stderr": 0.0012408675788602088, "rougeL_recall": 0.1932235805685923, "rougeL_recall_stderr": 0.00277498209308085, "rougeLsum_fmeasure": 0.11596810997110246, "rougeLsum_fmeasure_stderr": 0.001710823422300248, "rougeLsum_precision": 0.0839932835001092, "rougeLsum_precision_stderr": 0.0013382454039087637, "rougeLsum_recall": 0.20290901214848292, "rougeLsum_recall_stderr": 0.0029990659468279056}}, "4": {"article_DOC_summary": {"bleu": 0.27256554319567566, "bleu_stderr": 0.05393365990560443, "rouge1_fmeasure": 0.037884638019230664, "rouge1_fmeasure_stderr": 0.00214775480739452, "rouge1_precision": 0.03133602840154907, "rouge1_precision_stderr": 0.001987959380677703, "rouge1_recall": 0.06067401952247452, "rouge1_recall_stderr": 0.003487892178028924, "rouge2_fmeasure": 0.0043759041403374135, "rouge2_fmeasure_stderr": 0.0005183680894634575, "rouge2_precision": 0.0034573763117096636, "rouge2_precision_stderr": 0.00044354666596204615, "rouge2_recall": 0.007156768365840787, "rouge2_recall_stderr": 0.0008508883614159644, "rougeL_fmeasure": 0.029266330660064416, "rougeL_fmeasure_stderr": 0.0016348070626843912, "rougeL_precision": 0.024472567308614246, "rougeL_precision_stderr": 0.0015926598243951066, "rougeL_recall": 0.04698578958663985, "rougeL_recall_stderr": 0.002673075415704531, "rougeLsum_fmeasure": 0.031041105487741426, "rougeLsum_fmeasure_stderr": 0.0017460208416643014, "rougeLsum_precision": 0.0257721881730792, "rougeLsum_precision_stderr": 0.0016575889068278311, "rougeLsum_recall": 0.04994885638600292, "rougeLsum_recall_stderr": 0.0028614395409444103}}, "5": {"article_DOC_summary": {"bleu": 2.5634857131422677e-38, "bleu_stderr": 1.7875744611015253e-32, "rouge1_fmeasure": 0.0022183238269151938, "rouge1_fmeasure_stderr": 0.0006462435715584798, "rouge1_precision": 0.002422654460959852, "rouge1_precision_stderr": 0.000701445835208553, "rouge1_recall": 0.002150434002930073, "rouge1_recall_stderr": 0.0006364013868075673, "rouge2_fmeasure": 0.00044144904818645863, "rouge2_fmeasure_stderr": 0.00024927107535141214, "rouge2_precision": 0.00047185826875061065, "rouge2_precision_stderr": 0.00025359131866297053, "rouge2_recall": 0.00042238421955403087, "rouge2_recall_stderr": 0.00024978354101036374, "rougeL_fmeasure": 0.0018677137784396751, "rougeL_fmeasure_stderr": 0.0005453913617070764, "rougeL_precision": 0.0020288572682842206, "rougeL_precision_stderr": 0.000585169484066717, "rougeL_recall": 0.0018274673120388537, "rougeL_recall_stderr": 0.0005474767964183582, "rougeLsum_fmeasure": 0.0019066970935807948, "rougeLsum_fmeasure_stderr": 0.0005494437621613826, "rougeLsum_precision": 0.00207399584371078, "rougeLsum_precision_stderr": 0.0005893776256546286, "rougeLsum_recall": 0.001865187279004104, "rougeLsum_recall_stderr": 0.0005528638398211417}}}} \ No newline at end of file diff --git a/4b284b1b9c4seed3/evaluation/generation/slim.4b284b1b9c4seed3_GEM-web_nlg_en_PALM_prompt_0.json b/4b284b1b9c4seed3/evaluation/generation/slim.4b284b1b9c4seed3_GEM-web_nlg_en_PALM_prompt_0.json new file mode 100644 index 0000000000000000000000000000000000000000..3141fd46741c191638eda02c82130dadd8d8c026 --- /dev/null +++ b/4b284b1b9c4seed3/evaluation/generation/slim.4b284b1b9c4seed3_GEM-web_nlg_en_PALM_prompt_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.32012773562587393, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.018886919871708343 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.06825136821356759, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.00237062733299883 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.2508286238498341, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.004661697991334146 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.0899762528447479, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0020354843345656163 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.030615387870315716, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0016384196683051863 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.11248984628302856, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0030543468265705285 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.03944916755986983, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.001249719129780461 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.06342619049690505, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.002233393033449764 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.23548259610722824, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004438251763555299 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.08360285576779355, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0018856928971255989 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.06406542591417572, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0022429625274388077 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.234275763130725, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.00433154610375273 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.08427145597780734, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0019051123678010644 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b1b9c4seed3/evaluation/generation/slim.4b284b1b9c4seed3_GEM-web_nlg_en_PALM_prompt_1.json b/4b284b1b9c4seed3/evaluation/generation/slim.4b284b1b9c4seed3_GEM-web_nlg_en_PALM_prompt_1.json new file mode 100644 index 0000000000000000000000000000000000000000..ed5c7696ec719ee008e5c137cc8a882b9aca10fc --- /dev/null +++ b/4b284b1b9c4seed3/evaluation/generation/slim.4b284b1b9c4seed3_GEM-web_nlg_en_PALM_prompt_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.28781282710307465, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.01899808984283447 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.0527754711256334, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0014904713251823198 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.2537614091915221, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.004702310798072158 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.07847336913595586, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.001535955643926011 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.021533529321543874, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0007685776439012483 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.10966078271884003, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.002981675456939165 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.032657251493622856, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0009264643374386928 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.04876649614656279, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.001420498632004972 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.23339792109691904, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004315010087105858 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.07228685200884048, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0014209363141639564 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.04935178833491907, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0014212538671699328 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.23635405366452086, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.00434221432817691 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.07320160734011764, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0014251444099725329 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b1b9c4seed3/evaluation/generation/slim.4b284b1b9c4seed3_GEM-web_nlg_en_PALM_prompt_2.json b/4b284b1b9c4seed3/evaluation/generation/slim.4b284b1b9c4seed3_GEM-web_nlg_en_PALM_prompt_2.json new file mode 100644 index 0000000000000000000000000000000000000000..926abef81629ca372e21e10c43e546f0a081968b --- /dev/null +++ b/4b284b1b9c4seed3/evaluation/generation/slim.4b284b1b9c4seed3_GEM-web_nlg_en_PALM_prompt_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.32085939271138914, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.023874716323242045 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.05368960443919722, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0013878849609328464 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.2687130245556709, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.004740106099310347 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.08108986156959869, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0015435730709568757 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.022426372869437324, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0008085489202082841 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.11689977539927107, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.00300061931368436 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.03412133307095403, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0009323084416353588 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.048651633590719855, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0011827185282768337 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.24511580579594355, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004282778444187627 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.07379515479031812, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0013763914362202537 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.05014569138865563, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.001314326894957353 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.24950401790874296, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004286277514587859 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.07555165803520482, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0014213371826134968 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b1b9c4seed3/evaluation/generation/slim.4b284b1b9c4seed3_GEM-web_nlg_en_PALM_prompt_3.json b/4b284b1b9c4seed3/evaluation/generation/slim.4b284b1b9c4seed3_GEM-web_nlg_en_PALM_prompt_3.json new file mode 100644 index 0000000000000000000000000000000000000000..f8632197ef238ffaa1519be29c276bd57a760ba2 --- /dev/null +++ b/4b284b1b9c4seed3/evaluation/generation/slim.4b284b1b9c4seed3_GEM-web_nlg_en_PALM_prompt_3.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.328454678316601, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.022343422759414436 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.052008963484847605, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0014633614953241854 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.26281409902133185, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0047415561831233915 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.07919929805647623, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.001514394418998029 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.02118860914793864, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0008530949812868349 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.11276078198061254, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0030219172592672325 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.032486553286374405, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0008957923404999381 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.0471171164690475, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0013827485067535008 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.23822249787189817, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0042466165786672035 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.07148770019595055, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0013416340928285905 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.04892298323961062, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0014183478958578937 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.24590296884903542, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004380487268920286 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.07424172013111648, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0014133679260911725 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 3, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b1b9c4seed3/evaluation/generation/slim.4b284b1b9c4seed3_GEM-web_nlg_en_PALM_prompt_4.json b/4b284b1b9c4seed3/evaluation/generation/slim.4b284b1b9c4seed3_GEM-web_nlg_en_PALM_prompt_4.json new file mode 100644 index 0000000000000000000000000000000000000000..a6f077a66de04a3cc9fb1d403d7d8470bc593418 --- /dev/null +++ b/4b284b1b9c4seed3/evaluation/generation/slim.4b284b1b9c4seed3_GEM-web_nlg_en_PALM_prompt_4.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.3319702594644372, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.017323146780773062 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.05459708827196318, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0015720228379579838 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.2657448353396512, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.004717475684567482 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.08161632894859638, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0015256642009196088 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.023141351440564402, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.001127390810261633 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.11549040824815301, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0030025248991349058 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.03357767413194358, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0009162455741147543 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.04843785490759391, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0014543602029517073 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.23813768049670572, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004172909727083725 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.07227592144254627, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0013148844913734015 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.05090666274679119, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0014735025076296423 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.2482641520424661, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004326751256652749 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.07605405086627043, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0014106467606439447 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 4, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b1b9c4seed3/evaluation/generation/slim.4b284b1b9c4seed3_GEM-web_nlg_en_PALM_prompt_5.json b/4b284b1b9c4seed3/evaluation/generation/slim.4b284b1b9c4seed3_GEM-web_nlg_en_PALM_prompt_5.json new file mode 100644 index 0000000000000000000000000000000000000000..07818a934bf3777e0006fcff119d1ad66991da47 --- /dev/null +++ b/4b284b1b9c4seed3/evaluation/generation/slim.4b284b1b9c4seed3_GEM-web_nlg_en_PALM_prompt_5.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.39182011395821026, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.03017462277769791 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.05338210822991803, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0011795913375033742 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.2739388133076789, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.004725041678049671 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.08316112835678297, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0015044194584303333 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.02230990790026212, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0007134756313875014 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.12067184027915072, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.003047769920528369 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.03484163213544278, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0009120223523826239 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.04760001656977872, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.001056801997116071 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.2449561247042928, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004191935654465999 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.07405669758488781, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0013146857723887232 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.049818219801901514, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0011057069363974176 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.25508548910812884, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004349187676537093 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.07747218411731929, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0013880210497301878 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 5, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b1b9c4seed3/evaluation/generation/slim.4b284b1b9c4seed3_GEM-wiki_lingua_en_tldr_en_0.json b/4b284b1b9c4seed3/evaluation/generation/slim.4b284b1b9c4seed3_GEM-wiki_lingua_en_tldr_en_0.json new file mode 100644 index 0000000000000000000000000000000000000000..d809bbce47e34c48b5750fc934cda27bb3271eb4 --- /dev/null +++ b/4b284b1b9c4seed3/evaluation/generation/slim.4b284b1b9c4seed3_GEM-wiki_lingua_en_tldr_en_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.14881678764247983, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0018075069170291314 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.24793312894988265, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.002389930611487624 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.1723366320397076, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0016970728587596892 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.025628754354153325, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0006556947869924073 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.04387904423436066, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0012152943972142077 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.02968820163157077, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0007214568491876274 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.11061636395219109, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0012170197578614795 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.19130257812101642, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.001903442450094291 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.12964957358415072, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.001174103551409633 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.13872341402711671, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0016795577613053013 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.23159850567749277, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.002229753265274432 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.1606987702240205, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0015723044572643534 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 1.2190291379439195, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.08836041456372522 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b1b9c4seed3/evaluation/generation/slim.4b284b1b9c4seed3_GEM-wiki_lingua_en_tldr_en_1.json b/4b284b1b9c4seed3/evaluation/generation/slim.4b284b1b9c4seed3_GEM-wiki_lingua_en_tldr_en_1.json new file mode 100644 index 0000000000000000000000000000000000000000..7b008c2c532e1f9c677ad52e16a21e4076aa0cfd --- /dev/null +++ b/4b284b1b9c4seed3/evaluation/generation/slim.4b284b1b9c4seed3_GEM-wiki_lingua_en_tldr_en_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.15240917543961252, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.001893453848440131 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.25542377808907146, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0024641171624728577 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.17711899758881897, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0017763415721639936 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.029132226950407722, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.000722011658200494 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.049639629425446356, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0012773856244254617 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.03374713766036158, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0007818322344438194 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.10994692166995118, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0012260681075949413 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.19293230076900478, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0019284923872095526 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.12974115857300988, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0011843934409556005 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.1427583503702487, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0017641069847062667 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.24069300754030848, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0023353688459108405 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.16618151783978977, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0016552458293647842 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 1.5590008346037099, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.06892531048465908 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b1b9c4seed3/evaluation/generation/slim.4b284b1b9c4seed3_GEM-wiki_lingua_en_tldr_en_2.json b/4b284b1b9c4seed3/evaluation/generation/slim.4b284b1b9c4seed3_GEM-wiki_lingua_en_tldr_en_2.json new file mode 100644 index 0000000000000000000000000000000000000000..0e679f58768a1e02b0ceb3a8d78ffe1eb09915f0 --- /dev/null +++ b/4b284b1b9c4seed3/evaluation/generation/slim.4b284b1b9c4seed3_GEM-wiki_lingua_en_tldr_en_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.15159610505617108, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0018921710224610877 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.2536664028604043, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0023916817331507876 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.17612683398478715, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0017563955053422117 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.02782910309662972, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0007111400329440863 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.04643317452251163, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0012211811473359306 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.03193124516131047, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.000758958083313296 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.11083516090740873, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0012614447636676077 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.19352563235261244, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0019031906464486539 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.1305484526211359, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0011976224297953603 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.1424531837738363, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0017681228614650911 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.23940558197543957, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0022600581442295 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.1656855868051239, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0016384579347020886 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 1.423539576651847, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.05590338188617223 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b1b9c4seed3/evaluation/generation/slim.4b284b1b9c4seed3_GEM-wiki_lingua_en_tldr_en_3.json b/4b284b1b9c4seed3/evaluation/generation/slim.4b284b1b9c4seed3_GEM-wiki_lingua_en_tldr_en_3.json new file mode 100644 index 0000000000000000000000000000000000000000..133a5d4bc2f15becde469d5a9aff0016dd4d69a9 --- /dev/null +++ b/4b284b1b9c4seed3/evaluation/generation/slim.4b284b1b9c4seed3_GEM-wiki_lingua_en_tldr_en_3.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.13298493032742092, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0021599143965991448 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.214129162398553, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0028318625372094723 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.14896513024586858, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0020016614890125467 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.0244781955065012, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0007307175719718521 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.03981635760280176, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0012026016154760618 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.02730656796059889, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0007432758390663112 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.09875466672002745, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.001559084136737345 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.1644184900777515, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.00222028334382692 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.11134915972896199, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.00140777630827098 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.12471488513914283, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0020316307804283357 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.20148242502649036, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0026760218524170916 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.1397033192660591, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0018672195336514297 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 1.402481855726376, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.07496831085827607 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 3, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b1b9c4seed3/evaluation/generation/slim.4b284b1b9c4seed3_GEM-wiki_lingua_en_tldr_en_4.json b/4b284b1b9c4seed3/evaluation/generation/slim.4b284b1b9c4seed3_GEM-wiki_lingua_en_tldr_en_4.json new file mode 100644 index 0000000000000000000000000000000000000000..a8ddaf5685a1528534bde0489351637fd48ab637 --- /dev/null +++ b/4b284b1b9c4seed3/evaluation/generation/slim.4b284b1b9c4seed3_GEM-wiki_lingua_en_tldr_en_4.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.04578189123199333, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0017562670636657443 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.07399147773842517, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.002550315174376835 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.0495274627219381, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.00169718420379995 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.008690556943839151, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0006452419871034267 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.014071929895195552, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0008009026229828391 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.009286374730690028, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.00050108884216674 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.035008115979705615, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0013409826184435712 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.058241103416270305, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0020319511583359808 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.03797030362668432, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0012710366329130882 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.042745554189029616, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0016289097623771287 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.06929822143002932, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.002385334871151041 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.046311955140639516, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0015800586441838697 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 0.3627379747836102, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.03354762768029023 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 4, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b1b9c4seed3/evaluation/generation/slim.4b284b1b9c4seed3_GEM-wiki_lingua_en_tldr_en_5.json b/4b284b1b9c4seed3/evaluation/generation/slim.4b284b1b9c4seed3_GEM-wiki_lingua_en_tldr_en_5.json new file mode 100644 index 0000000000000000000000000000000000000000..e8174f4cd748334c6cde9dc5a4fca3d3aa02c077 --- /dev/null +++ b/4b284b1b9c4seed3/evaluation/generation/slim.4b284b1b9c4seed3_GEM-wiki_lingua_en_tldr_en_5.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.0074834967426424225, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0007736454980237687 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.011934633047410595, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0011163746139347308 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.008032143708786618, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.000769380549886739 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.0011994561802445166, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.00018233396610689006 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.0022243917557991503, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.000328054783161663 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.0014060293109536969, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0002040774536152345 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.005527948528114916, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0005645889276529973 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.009193511694802203, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0008680965592063552 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.005954377693063202, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.000556855926391102 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.007022799151439734, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0007312149938921309 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.011189580936988842, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0010462966465602747 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.0075115815949656104, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0007197306094579381 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 5.170172033055458e-07, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 1.1813622697325427e-06 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 5, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b1b9c4seed3/evaluation/generation/slim.4b284b1b9c4seed3_e2e_nlg_cleaned_generate_text_restaurant_0.json b/4b284b1b9c4seed3/evaluation/generation/slim.4b284b1b9c4seed3_e2e_nlg_cleaned_generate_text_restaurant_0.json new file mode 100644 index 0000000000000000000000000000000000000000..40f1523c48a420bab1ba4f12a9d0956dffaebcbe --- /dev/null +++ b/4b284b1b9c4seed3/evaluation/generation/slim.4b284b1b9c4seed3_e2e_nlg_cleaned_generate_text_restaurant_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 0.023059028483234455, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.009986858835187516 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.08646635544730007, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.00377831577985332 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.031635634606258116, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.001269300288541845 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.038140802367729314, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.001495094420064931 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.03990955933185571, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0024489170391253133 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.00853219303645261, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.00046389097916627487 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.011993223757428687, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0006456302396314265 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.07881038410549088, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.0035148627119781285 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.028615455542499727, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.0011483835890292063 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.034369983243126824, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0013496596592950014 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.07924093489385359, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.0035579093389609888 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.027741907284705433, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.0011204355268068656 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.033892840605688854, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0013502083491247366 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b1b9c4seed3/evaluation/generation/slim.4b284b1b9c4seed3_e2e_nlg_cleaned_generate_text_restaurant_1.json b/4b284b1b9c4seed3/evaluation/generation/slim.4b284b1b9c4seed3_e2e_nlg_cleaned_generate_text_restaurant_1.json new file mode 100644 index 0000000000000000000000000000000000000000..879974954d470b7900d1a1cdd9a334662c5aa0a6 --- /dev/null +++ b/4b284b1b9c4seed3/evaluation/generation/slim.4b284b1b9c4seed3_e2e_nlg_cleaned_generate_text_restaurant_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 5.92327601668373, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.05843145852320597 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.3069015502240498, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.0027141658342019533 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.39979069436919706, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.0027344739468908464 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.3195090019700737, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.0019316739490464164 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.11881015634283494, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0018726653522764317 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.1547177292472664, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.0018688850569839306 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.12124769523896647, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0013611141408615495 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.2310708605355665, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.0022062598471417403 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.3039710432903314, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.002265711626940462 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.24042839740750466, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0014957834627688047 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.2575158229010334, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.002504168232503219 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.33420271307698657, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.002509091259792972 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.26693221189807087, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0017924495261329944 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b1b9c4seed3/evaluation/generation/slim.4b284b1b9c4seed3_e2e_nlg_cleaned_generate_text_restaurant_2.json b/4b284b1b9c4seed3/evaluation/generation/slim.4b284b1b9c4seed3_e2e_nlg_cleaned_generate_text_restaurant_2.json new file mode 100644 index 0000000000000000000000000000000000000000..a14838e82b3b95e5a0458c3a06a560c39a0e04b2 --- /dev/null +++ b/4b284b1b9c4seed3/evaluation/generation/slim.4b284b1b9c4seed3_e2e_nlg_cleaned_generate_text_restaurant_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 5.798513972951498, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.11353083630417822 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.27602836621141386, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.0025780345869436143 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.4181131170949761, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.0026506272040465527 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.30806587260671714, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.0018509005121755077 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.11242493035118595, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0017273889338398733 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.17096478516816419, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.0019293105165237693 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.12337486765629936, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0013085936094396561 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.21692521379325555, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.0020430932459005492 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.33431954510893935, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.0022474731694641457 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.24343008869727828, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0014161383440201198 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.23257813200591104, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.0023360478957229073 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.3524929035089362, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.0025454158780705265 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.2593626081415107, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0017672461865662792 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b1b9c4seed3/evaluation/generation/slim.4b284b1b9c4seed3_e2e_nlg_cleaned_generate_text_restaurant_3.json b/4b284b1b9c4seed3/evaluation/generation/slim.4b284b1b9c4seed3_e2e_nlg_cleaned_generate_text_restaurant_3.json new file mode 100644 index 0000000000000000000000000000000000000000..dd13cce32d2c45535d06cfb52fce3d1e0c094c08 --- /dev/null +++ b/4b284b1b9c4seed3/evaluation/generation/slim.4b284b1b9c4seed3_e2e_nlg_cleaned_generate_text_restaurant_3.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 5.644092780950039, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.10217788685749982 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.26161576269851167, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.0025136188998387504 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.41515437679947936, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.002598826549494006 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.2981344592034621, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.0018206530175075195 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.10693721487632077, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0017057516502692433 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.16981690105478955, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.0019012605105245895 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.11947929128220935, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0012973693582640367 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.2094840503016106, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.002037886584044074 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.3376907481718358, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.00220926835759776 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.23991261995087904, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0014219136572907404 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.22116618474928101, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.00229609611848074 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.35126017567747847, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.002506017472827367 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.25177947103229636, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.001736956932091685 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 3, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b1b9c4seed3/evaluation/generation/slim.4b284b1b9c4seed3_e2e_nlg_cleaned_generate_text_restaurant_4.json b/4b284b1b9c4seed3/evaluation/generation/slim.4b284b1b9c4seed3_e2e_nlg_cleaned_generate_text_restaurant_4.json new file mode 100644 index 0000000000000000000000000000000000000000..3d19f6806d274182cd3ce8920e2252a61982fd5e --- /dev/null +++ b/4b284b1b9c4seed3/evaluation/generation/slim.4b284b1b9c4seed3_e2e_nlg_cleaned_generate_text_restaurant_4.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 5.7499537608526206, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.0771735259601375 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.25565023567980505, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.0024296319398495005 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.4223930509739377, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.0025959915251734665 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.297032269913346, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.0018374797196724821 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.10591522249436582, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.001656138422232947 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.17476583770251305, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.0019174634136014039 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.12065447384924378, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.001292230076177851 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.2057296852438049, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.0019458009062281374 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.3452387295232376, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.0022232954316674606 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.2401166198393427, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.001412545210957851 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.2170829438014025, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.0022139919637352325 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.359511646806021, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.0025629445270113453 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.2520913436920952, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.001756285809527599 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 4, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b1b9c4seed3/evaluation/generation/slim.4b284b1b9c4seed3_e2e_nlg_cleaned_generate_text_restaurant_5.json b/4b284b1b9c4seed3/evaluation/generation/slim.4b284b1b9c4seed3_e2e_nlg_cleaned_generate_text_restaurant_5.json new file mode 100644 index 0000000000000000000000000000000000000000..9ee712e1d6ce6fa69ce3395274b2193e7ee8cebc --- /dev/null +++ b/4b284b1b9c4seed3/evaluation/generation/slim.4b284b1b9c4seed3_e2e_nlg_cleaned_generate_text_restaurant_5.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 5.770537159308962, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.1190361381685094 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.25787672074394796, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.0025328256284091236 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.42573900503618045, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.0025754554062627877 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.2987490942442688, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.00182958925425156 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.10790420126833489, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.001769950634717068 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.1764978054536251, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.001953358091932576 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.12169295522428568, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0012994307062877601 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.207955556140787, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.002097923926132232 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.3476137840160232, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.002207282217829847 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.24138350753763696, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0014118485855993332 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.21954740035518447, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.0023503093866769544 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.3624191463006945, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.0025392023747063696 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.2537764861825883, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0017644696653914508 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 5, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b1b9c4seed3/evaluation/generation/slim.4b284b1b9c4seed3_gem_xsum_article_DOC_summary_0.json b/4b284b1b9c4seed3/evaluation/generation/slim.4b284b1b9c4seed3_gem_xsum_article_DOC_summary_0.json new file mode 100644 index 0000000000000000000000000000000000000000..968d72c0ab62b25fadc80ca4a5466c82260a659f --- /dev/null +++ b/4b284b1b9c4seed3/evaluation/generation/slim.4b284b1b9c4seed3_gem_xsum_article_DOC_summary_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.14542424202725895, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.0022138246399507205 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.31877105379992854, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.0039014668311384846 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.1924128186381312, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.002360900852656541 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.026751288404993658, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0010068959458770191 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.06119647795475897, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.0021992283140675147 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.035715714855404174, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0012470772810957468 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.10850993070385385, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0016022951483510026 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.2403257780307599, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.0030478006648468224 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.14397207180406998, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0017392037354323953 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.1137602974676654, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0016663613584011713 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.25349408376272603, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.0033388300752575585 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.1513854308550901, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0018706736809661465 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 1.2602613828624476, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.08741245069026914 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b1b9c4seed3/evaluation/generation/slim.4b284b1b9c4seed3_gem_xsum_article_DOC_summary_1.json b/4b284b1b9c4seed3/evaluation/generation/slim.4b284b1b9c4seed3_gem_xsum_article_DOC_summary_1.json new file mode 100644 index 0000000000000000000000000000000000000000..50dbd688f7944d2fce6db10f5bf692fbe4daefaf --- /dev/null +++ b/4b284b1b9c4seed3/evaluation/generation/slim.4b284b1b9c4seed3_gem_xsum_article_DOC_summary_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.10549993650520251, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.00153501677078187 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.2612212727377519, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.0034404286739595498 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.14848707861095392, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.0020468594975290248 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.013994761205987642, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0007149071339383721 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.0356140526531422, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.0017994780886659853 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.01983861975775417, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0009966264701985932 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.08181009058637802, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0011239080238855375 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.20392678730897415, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.002600805826506937 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.11531599073392822, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0015026013618598068 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.08559803726047839, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.001213987918870468 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.21400310748327384, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.0028528494274868274 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.12077280177911864, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0016322822837075467 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 0.7915703643644384, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.08396451150549139 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b1b9c4seed3/evaluation/generation/slim.4b284b1b9c4seed3_gem_xsum_article_DOC_summary_2.json b/4b284b1b9c4seed3/evaluation/generation/slim.4b284b1b9c4seed3_gem_xsum_article_DOC_summary_2.json new file mode 100644 index 0000000000000000000000000000000000000000..8f1a6011848d039ff4d0935533aaca02fe69854e --- /dev/null +++ b/4b284b1b9c4seed3/evaluation/generation/slim.4b284b1b9c4seed3_gem_xsum_article_DOC_summary_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.10471570168180548, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.0014494215119621229 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.2620545799252738, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.003320038801060601 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.14783482736166878, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.001930898165701915 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.01319945934793176, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0006302627050860287 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.03471557162965618, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.0016776406415917023 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.018873329322073275, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0008955667212919246 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.08197306181617371, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0010777654445218213 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.2071426347373322, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.0026041548046999877 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.11600786897853718, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0014481058046010048 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.08489744619220965, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0011830647260639108 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.21467503234909532, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.002893408444556316 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.12019939004505038, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0016060029611780855 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 0.6502670718184665, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.05324899628422249 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b1b9c4seed3/evaluation/generation/slim.4b284b1b9c4seed3_gem_xsum_article_DOC_summary_3.json b/4b284b1b9c4seed3/evaluation/generation/slim.4b284b1b9c4seed3_gem_xsum_article_DOC_summary_3.json new file mode 100644 index 0000000000000000000000000000000000000000..54f4df3b84a493cf20a23b754af7e2bec866c4ec --- /dev/null +++ b/4b284b1b9c4seed3/evaluation/generation/slim.4b284b1b9c4seed3_gem_xsum_article_DOC_summary_3.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.10410860827262407, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.0016985601546784064 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.24975935094410306, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.0036359468821554417 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.1434515966047625, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.0021396059501441697 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.0133838272101195, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0006651947823416613 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.032957650415980116, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.0016410836459370027 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.01863408799342264, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0009121268268702102 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.07992461082726765, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0012408675788602088 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.1932235805685923, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.00277498209308085 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.11028077942863275, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0015625007588984398 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.0839932835001092, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0013382454039087637 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.20290901214848292, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.0029990659468279056 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.11596810997110246, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.001710823422300248 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 0.72650775578876, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.07009722650167388 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 3, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b1b9c4seed3/evaluation/generation/slim.4b284b1b9c4seed3_gem_xsum_article_DOC_summary_4.json b/4b284b1b9c4seed3/evaluation/generation/slim.4b284b1b9c4seed3_gem_xsum_article_DOC_summary_4.json new file mode 100644 index 0000000000000000000000000000000000000000..ac964276983edd051f98d999724fa98a7eb4c5c2 --- /dev/null +++ b/4b284b1b9c4seed3/evaluation/generation/slim.4b284b1b9c4seed3_gem_xsum_article_DOC_summary_4.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.03133602840154907, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.001987959380677703 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.06067401952247452, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.003487892178028924 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.037884638019230664, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.00214775480739452 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.0034573763117096636, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.00044354666596204615 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.007156768365840787, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.0008508883614159644 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.0043759041403374135, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0005183680894634575 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.024472567308614246, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0015926598243951066 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.04698578958663985, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.002673075415704531 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.029266330660064416, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0016348070626843912 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.0257721881730792, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0016575889068278311 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.04994885638600292, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.0028614395409444103 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.031041105487741426, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0017460208416643014 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 0.27256554319567566, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.05393365990560443 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 4, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b1b9c4seed3/evaluation/generation/slim.4b284b1b9c4seed3_gem_xsum_article_DOC_summary_5.json b/4b284b1b9c4seed3/evaluation/generation/slim.4b284b1b9c4seed3_gem_xsum_article_DOC_summary_5.json new file mode 100644 index 0000000000000000000000000000000000000000..c5d83d82560643a0e948a5e1141b6a5c424b43c7 --- /dev/null +++ b/4b284b1b9c4seed3/evaluation/generation/slim.4b284b1b9c4seed3_gem_xsum_article_DOC_summary_5.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.002422654460959852, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.000701445835208553 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.002150434002930073, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.0006364013868075673 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.0022183238269151938, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.0006462435715584798 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.00047185826875061065, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.00025359131866297053 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.00042238421955403087, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.00024978354101036374 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.00044144904818645863, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.00024927107535141214 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.0020288572682842206, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.000585169484066717 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.0018274673120388537, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.0005474767964183582 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.0018677137784396751, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0005453913617070764 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.00207399584371078, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0005893776256546286 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.001865187279004104, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.0005528638398211417 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.0019066970935807948, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0005494437621613826 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 2.5634857131422677e-38, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 1.7875744611015253e-32 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 5, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b1b9c4seed3/evaluation/rankeval/4b284b1b9c4seed3_0.csv b/4b284b1b9c4seed3/evaluation/rankeval/4b284b1b9c4seed3_0.csv new file mode 100644 index 0000000000000000000000000000000000000000..5014101fcd2062c0e632c5d0cfd738a978058d09 --- /dev/null +++ b/4b284b1b9c4seed3/evaluation/rankeval/4b284b1b9c4seed3_0.csv @@ -0,0 +1,21 @@ +task,metric,value,err,version +anli_r1,acc,0.327,0.014842213153411242,0 +anli_r2,acc,0.334,0.014922019523732968,0 +anli_r3,acc,0.3358333333333333,0.013639261190932889,0 +arc_challenge,acc,0.24232081911262798,0.012521593295800115,0 +arc_challenge,acc_norm,0.2781569965870307,0.013094469919538793,0 +arc_easy,acc,0.494949494949495,0.010259260102565861,0 +arc_easy,acc_norm,0.44612794612794615,0.01020005782876501,0 +boolq,acc,0.45321100917431195,0.00870668126587249,1 +cb,acc,0.39285714285714285,0.0658538889806635,1 +cb,f1,0.36502627806975624,,1 +copa,acc,0.66,0.04760952285695238,0 +hellaswag,acc,0.3937462656841267,0.004875812021461996,0 +hellaswag,acc_norm,0.48994224258115915,0.004988771791854512,0 +piqa,acc,0.6969532100108814,0.010722648689531525,0 +piqa,acc_norm,0.7018498367791077,0.01067296411400829,0 +rte,acc,0.5595667870036101,0.02988212336311872,0 +sciq,acc,0.704,0.01444273494157502,0 +sciq,acc_norm,0.637,0.015213890444671283,0 +storycloze_2016,acc,0.6702298236237306,0.01087168247139514,0 +winogrande,acc,0.5303867403314917,0.014026510839428743,0 diff --git a/4b284b1b9c4seed3/evaluation/rankeval/4b284b1b9c4seed3_0.json b/4b284b1b9c4seed3/evaluation/rankeval/4b284b1b9c4seed3_0.json new file mode 100644 index 0000000000000000000000000000000000000000..060f8fee3d4c99c1e14a893bf660b71f0442aef0 --- /dev/null +++ b/4b284b1b9c4seed3/evaluation/rankeval/4b284b1b9c4seed3_0.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.327, + "acc_stderr": 0.014842213153411242 + }, + "anli_r2": { + "acc": 0.334, + "acc_stderr": 0.014922019523732968 + }, + "anli_r3": { + "acc": 0.3358333333333333, + "acc_stderr": 0.013639261190932889 + }, + "cb": { + "acc": 0.39285714285714285, + "acc_stderr": 0.0658538889806635, + "f1": 0.36502627806975624 + }, + "copa": { + "acc": 0.66, + "acc_stderr": 0.04760952285695238 + }, + "hellaswag": { + "acc": 0.3937462656841267, + "acc_stderr": 0.004875812021461996, + "acc_norm": 0.48994224258115915, + "acc_norm_stderr": 0.004988771791854512 + }, + "rte": { + "acc": 0.5595667870036101, + "acc_stderr": 0.02988212336311872 + }, + "winogrande": { + "acc": 0.5303867403314917, + "acc_stderr": 0.014026510839428743 + }, + "storycloze_2016": { + "acc": 0.6702298236237306, + "acc_stderr": 0.01087168247139514 + }, + "boolq": { + "acc": 0.45321100917431195, + "acc_stderr": 0.00870668126587249 + }, + "arc_easy": { + "acc": 0.494949494949495, + "acc_stderr": 0.010259260102565861, + "acc_norm": 0.44612794612794615, + "acc_norm_stderr": 0.01020005782876501 + }, + "arc_challenge": { + "acc": 0.24232081911262798, + "acc_stderr": 0.012521593295800115, + "acc_norm": 0.2781569965870307, + "acc_norm_stderr": 0.013094469919538793 + }, + "sciq": { + "acc": 0.704, + "acc_stderr": 0.01444273494157502, + "acc_norm": 0.637, + "acc_norm_stderr": 0.015213890444671283 + }, + "piqa": { + "acc": 0.6969532100108814, + "acc_stderr": 0.010722648689531525, + "acc_norm": 0.7018498367791077, + "acc_norm_stderr": 0.01067296411400829 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b1b9c4seed3/evaluation/rankeval/4b284b1b9c4seed3_1.csv b/4b284b1b9c4seed3/evaluation/rankeval/4b284b1b9c4seed3_1.csv new file mode 100644 index 0000000000000000000000000000000000000000..004598a1491b3cad414bfe80cc253ae2cd748557 --- /dev/null +++ b/4b284b1b9c4seed3/evaluation/rankeval/4b284b1b9c4seed3_1.csv @@ -0,0 +1,21 @@ +task,metric,value,err,version +anli_r1,acc,0.328,0.014853842487270334,0 +anli_r2,acc,0.331,0.01488827258820393,0 +anli_r3,acc,0.3275,0.013553211167251944,0 +arc_challenge,acc,0.2568259385665529,0.0127669237941168,0 +arc_challenge,acc_norm,0.2721843003412969,0.013006600406423707,0 +arc_easy,acc,0.48863636363636365,0.010257133441117106,0 +arc_easy,acc_norm,0.4532828282828283,0.010214901516731618,0 +boolq,acc,0.44954128440366975,0.008700409761350806,1 +cb,acc,0.42857142857142855,0.06672848092813058,1 +cb,f1,0.29607401850462617,,1 +copa,acc,0.72,0.04512608598542127,0 +hellaswag,acc,0.39454291973710415,0.004877534215987093,0 +hellaswag,acc_norm,0.4898426608245369,0.004988751698341149,0 +piqa,acc,0.6833514689880305,0.010853160531978483,0 +piqa,acc_norm,0.6931447225244831,0.010760295070580374,0 +rte,acc,0.5523465703971119,0.029931070362939533,0 +sciq,acc,0.707,0.014399942998441268,0 +sciq,acc_norm,0.696,0.01455320568795043,0 +storycloze_2016,acc,0.6509887760555852,0.01102264051910855,0 +winogrande,acc,0.5272296764009471,0.014031631629827694,0 diff --git a/4b284b1b9c4seed3/evaluation/rankeval/4b284b1b9c4seed3_1.json b/4b284b1b9c4seed3/evaluation/rankeval/4b284b1b9c4seed3_1.json new file mode 100644 index 0000000000000000000000000000000000000000..adbfec8f3e64702d0234ab5a8b0a8f0e6bcf7978 --- /dev/null +++ b/4b284b1b9c4seed3/evaluation/rankeval/4b284b1b9c4seed3_1.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.328, + "acc_stderr": 0.014853842487270334 + }, + "anli_r2": { + "acc": 0.331, + "acc_stderr": 0.01488827258820393 + }, + "anli_r3": { + "acc": 0.3275, + "acc_stderr": 0.013553211167251944 + }, + "cb": { + "acc": 0.42857142857142855, + "acc_stderr": 0.06672848092813058, + "f1": 0.29607401850462617 + }, + "copa": { + "acc": 0.72, + "acc_stderr": 0.04512608598542127 + }, + "hellaswag": { + "acc": 0.39454291973710415, + "acc_stderr": 0.004877534215987093, + "acc_norm": 0.4898426608245369, + "acc_norm_stderr": 0.004988751698341149 + }, + "rte": { + "acc": 0.5523465703971119, + "acc_stderr": 0.029931070362939533 + }, + "winogrande": { + "acc": 0.5272296764009471, + "acc_stderr": 0.014031631629827694 + }, + "storycloze_2016": { + "acc": 0.6509887760555852, + "acc_stderr": 0.01102264051910855 + }, + "boolq": { + "acc": 0.44954128440366975, + "acc_stderr": 0.008700409761350806 + }, + "arc_easy": { + "acc": 0.48863636363636365, + "acc_stderr": 0.010257133441117106, + "acc_norm": 0.4532828282828283, + "acc_norm_stderr": 0.010214901516731618 + }, + "arc_challenge": { + "acc": 0.2568259385665529, + "acc_stderr": 0.0127669237941168, + "acc_norm": 0.2721843003412969, + "acc_norm_stderr": 0.013006600406423707 + }, + "sciq": { + "acc": 0.707, + "acc_stderr": 0.014399942998441268, + "acc_norm": 0.696, + "acc_norm_stderr": 0.01455320568795043 + }, + "piqa": { + "acc": 0.6833514689880305, + "acc_stderr": 0.010853160531978483, + "acc_norm": 0.6931447225244831, + "acc_norm_stderr": 0.010760295070580374 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b1b9c4seed3/evaluation/rankeval/4b284b1b9c4seed3_2.csv b/4b284b1b9c4seed3/evaluation/rankeval/4b284b1b9c4seed3_2.csv new file mode 100644 index 0000000000000000000000000000000000000000..2ac482d3dfebe04377a54decb8be08d4208478e7 --- /dev/null +++ b/4b284b1b9c4seed3/evaluation/rankeval/4b284b1b9c4seed3_2.csv @@ -0,0 +1,21 @@ +task,metric,value,err,version +anli_r1,acc,0.317,0.014721675438880222,0 +anli_r2,acc,0.324,0.014806864733738857,0 +anli_r3,acc,0.32,0.013471620929769137,0 +arc_challenge,acc,0.24488054607508533,0.012566273985131356,0 +arc_challenge,acc_norm,0.28071672354948807,0.013131238126975586,0 +arc_easy,acc,0.492003367003367,0.01025847128984197,0 +arc_easy,acc_norm,0.45454545454545453,0.010217299762709435,0 +boolq,acc,0.4452599388379205,0.008692488322023064,1 +cb,acc,0.4107142857142857,0.0663363415035954,1 +cb,f1,0.36560846560846566,,1 +copa,acc,0.65,0.04793724854411019,0 +hellaswag,acc,0.3948416650069707,0.004878176541703575,0 +hellaswag,acc_norm,0.49083847839075884,0.0049889437217111995,0 +piqa,acc,0.6953210010881393,0.010738889044325161,0 +piqa,acc_norm,0.6958650707290533,0.010733493335721319,0 +rte,acc,0.48736462093862815,0.030086851767188564,0 +sciq,acc,0.722,0.014174516461485239,0 +sciq,acc_norm,0.702,0.014470846741134712,0 +storycloze_2016,acc,0.6563335114911811,0.010982724236255946,0 +winogrande,acc,0.5256511444356748,0.014033980956108562,0 diff --git a/4b284b1b9c4seed3/evaluation/rankeval/4b284b1b9c4seed3_2.json b/4b284b1b9c4seed3/evaluation/rankeval/4b284b1b9c4seed3_2.json new file mode 100644 index 0000000000000000000000000000000000000000..477812858deb0812d4ed8bc3268f4acecb9c7833 --- /dev/null +++ b/4b284b1b9c4seed3/evaluation/rankeval/4b284b1b9c4seed3_2.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.317, + "acc_stderr": 0.014721675438880222 + }, + "anli_r2": { + "acc": 0.324, + "acc_stderr": 0.014806864733738857 + }, + "anli_r3": { + "acc": 0.32, + "acc_stderr": 0.013471620929769137 + }, + "cb": { + "acc": 0.4107142857142857, + "acc_stderr": 0.0663363415035954, + "f1": 0.36560846560846566 + }, + "copa": { + "acc": 0.65, + "acc_stderr": 0.04793724854411019 + }, + "hellaswag": { + "acc": 0.3948416650069707, + "acc_stderr": 0.004878176541703575, + "acc_norm": 0.49083847839075884, + "acc_norm_stderr": 0.0049889437217111995 + }, + "rte": { + "acc": 0.48736462093862815, + "acc_stderr": 0.030086851767188564 + }, + "winogrande": { + "acc": 0.5256511444356748, + "acc_stderr": 0.014033980956108562 + }, + "storycloze_2016": { + "acc": 0.6563335114911811, + "acc_stderr": 0.010982724236255946 + }, + "boolq": { + "acc": 0.4452599388379205, + "acc_stderr": 0.008692488322023064 + }, + "arc_easy": { + "acc": 0.492003367003367, + "acc_stderr": 0.01025847128984197, + "acc_norm": 0.45454545454545453, + "acc_norm_stderr": 0.010217299762709435 + }, + "arc_challenge": { + "acc": 0.24488054607508533, + "acc_stderr": 0.012566273985131356, + "acc_norm": 0.28071672354948807, + "acc_norm_stderr": 0.013131238126975586 + }, + "sciq": { + "acc": 0.722, + "acc_stderr": 0.014174516461485239, + "acc_norm": 0.702, + "acc_norm_stderr": 0.014470846741134712 + }, + "piqa": { + "acc": 0.6953210010881393, + "acc_stderr": 0.010738889044325161, + "acc_norm": 0.6958650707290533, + "acc_norm_stderr": 0.010733493335721319 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b1b9c4seed3/evaluation/rankeval/4b284b1b9c4seed3_3.csv b/4b284b1b9c4seed3/evaluation/rankeval/4b284b1b9c4seed3_3.csv new file mode 100644 index 0000000000000000000000000000000000000000..0af370e2e6c920a956ee307957017a673a85fe66 --- /dev/null +++ b/4b284b1b9c4seed3/evaluation/rankeval/4b284b1b9c4seed3_3.csv @@ -0,0 +1,21 @@ +task,metric,value,err,version +anli_r1,acc,0.34,0.014987482264363937,0 +anli_r2,acc,0.375,0.015316971293620996,0 +anli_r3,acc,0.3358333333333333,0.013639261190932882,0 +arc_challenge,acc,0.23293515358361774,0.012352507042617394,0 +arc_challenge,acc_norm,0.26023890784982934,0.012821930225112556,0 +arc_easy,acc,0.4718013468013468,0.010243454104071792,0 +arc_easy,acc_norm,0.4553872053872054,0.010218861787618732,0 +boolq,acc,0.4504587155963303,0.008702022442950874,1 +cb,acc,0.5357142857142857,0.06724777654937658,1 +cb,f1,0.538474366304555,,1 +copa,acc,0.68,0.046882617226215034,0 +hellaswag,acc,0.3951404102768373,0.004878816961012042,0 +hellaswag,acc_norm,0.49372634933280224,0.0049893886134388,0 +piqa,acc,0.6920565832426551,0.010770892367463689,0 +piqa,acc_norm,0.6985854189336235,0.01070624824275376,0 +rte,acc,0.5090252707581228,0.030091559826331334,0 +sciq,acc,0.728,0.014078856992462615,0 +sciq,acc_norm,0.711,0.014341711358296183,0 +storycloze_2016,acc,0.6531266702298236,0.011006857922124124,0 +winogrande,acc,0.5343330702446725,0.014019317531542569,0 diff --git a/4b284b1b9c4seed3/evaluation/rankeval/4b284b1b9c4seed3_3.json b/4b284b1b9c4seed3/evaluation/rankeval/4b284b1b9c4seed3_3.json new file mode 100644 index 0000000000000000000000000000000000000000..210f8443ed32f51d86bfaa16ab8d3b29f4b59404 --- /dev/null +++ b/4b284b1b9c4seed3/evaluation/rankeval/4b284b1b9c4seed3_3.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.34, + "acc_stderr": 0.014987482264363937 + }, + "anli_r2": { + "acc": 0.375, + "acc_stderr": 0.015316971293620996 + }, + "anli_r3": { + "acc": 0.3358333333333333, + "acc_stderr": 0.013639261190932882 + }, + "cb": { + "acc": 0.5357142857142857, + "acc_stderr": 0.06724777654937658, + "f1": 0.538474366304555 + }, + "copa": { + "acc": 0.68, + "acc_stderr": 0.046882617226215034 + }, + "hellaswag": { + "acc": 0.3951404102768373, + "acc_stderr": 0.004878816961012042, + "acc_norm": 0.49372634933280224, + "acc_norm_stderr": 0.0049893886134388 + }, + "rte": { + "acc": 0.5090252707581228, + "acc_stderr": 0.030091559826331334 + }, + "winogrande": { + "acc": 0.5343330702446725, + "acc_stderr": 0.014019317531542569 + }, + "storycloze_2016": { + "acc": 0.6531266702298236, + "acc_stderr": 0.011006857922124124 + }, + "boolq": { + "acc": 0.4504587155963303, + "acc_stderr": 0.008702022442950874 + }, + "arc_easy": { + "acc": 0.4718013468013468, + "acc_stderr": 0.010243454104071792, + "acc_norm": 0.4553872053872054, + "acc_norm_stderr": 0.010218861787618732 + }, + "arc_challenge": { + "acc": 0.23293515358361774, + "acc_stderr": 0.012352507042617394, + "acc_norm": 0.26023890784982934, + "acc_norm_stderr": 0.012821930225112556 + }, + "sciq": { + "acc": 0.728, + "acc_stderr": 0.014078856992462615, + "acc_norm": 0.711, + "acc_norm_stderr": 0.014341711358296183 + }, + "piqa": { + "acc": 0.6920565832426551, + "acc_stderr": 0.010770892367463689, + "acc_norm": 0.6985854189336235, + "acc_norm_stderr": 0.01070624824275376 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b1b9c4seed3/evaluation/rankeval/4b284b1b9c4seed3_4.csv b/4b284b1b9c4seed3/evaluation/rankeval/4b284b1b9c4seed3_4.csv new file mode 100644 index 0000000000000000000000000000000000000000..bcd00ea64c98b2c805f94c3b7db23e352d30e479 --- /dev/null +++ b/4b284b1b9c4seed3/evaluation/rankeval/4b284b1b9c4seed3_4.csv @@ -0,0 +1,21 @@ +task,metric,value,err,version +anli_r1,acc,0.35,0.015090650341444233,0 +anli_r2,acc,0.331,0.014888272588203936,0 +anli_r3,acc,0.3275,0.01355321116725194,0 +arc_challenge,acc,0.23890784982935154,0.012461071376316621,0 +arc_challenge,acc_norm,0.26791808873720135,0.01294203019513642,0 +arc_easy,acc,0.4734848484848485,0.010245347015573716,0 +arc_easy,acc_norm,0.4612794612794613,0.010228972678389592,0 +boolq,acc,0.44862385321100917,0.008698767182005266,1 +cb,acc,0.48214285714285715,0.0673769750864465,1 +cb,f1,0.33543859649122804,,1 +copa,acc,0.67,0.04725815626252607,0 +hellaswag,acc,0.39713204540928104,0.004883037758919964,0 +hellaswag,acc_norm,0.49302927703644694,0.004989296471157072,0 +piqa,acc,0.6806311207834603,0.010877964076613731,0 +piqa,acc_norm,0.6844396082698585,0.010843119201758936,0 +rte,acc,0.5523465703971119,0.029931070362939533,0 +sciq,acc,0.742,0.013842963108656603,0 +sciq,acc_norm,0.718,0.014236526215291333,0 +storycloze_2016,acc,0.6531266702298236,0.011006857922124124,0 +winogrande,acc,0.5343330702446725,0.014019317531542569,0 diff --git a/4b284b1b9c4seed3/evaluation/rankeval/4b284b1b9c4seed3_4.json b/4b284b1b9c4seed3/evaluation/rankeval/4b284b1b9c4seed3_4.json new file mode 100644 index 0000000000000000000000000000000000000000..752c135aec96912137945c03bc617eeebead308d --- /dev/null +++ b/4b284b1b9c4seed3/evaluation/rankeval/4b284b1b9c4seed3_4.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.35, + "acc_stderr": 0.015090650341444233 + }, + "anli_r2": { + "acc": 0.331, + "acc_stderr": 0.014888272588203936 + }, + "anli_r3": { + "acc": 0.3275, + "acc_stderr": 0.01355321116725194 + }, + "cb": { + "acc": 0.48214285714285715, + "acc_stderr": 0.0673769750864465, + "f1": 0.33543859649122804 + }, + "copa": { + "acc": 0.67, + "acc_stderr": 0.04725815626252607 + }, + "hellaswag": { + "acc": 0.39713204540928104, + "acc_stderr": 0.004883037758919964, + "acc_norm": 0.49302927703644694, + "acc_norm_stderr": 0.004989296471157072 + }, + "rte": { + "acc": 0.5523465703971119, + "acc_stderr": 0.029931070362939533 + }, + "winogrande": { + "acc": 0.5343330702446725, + "acc_stderr": 0.014019317531542569 + }, + "storycloze_2016": { + "acc": 0.6531266702298236, + "acc_stderr": 0.011006857922124124 + }, + "boolq": { + "acc": 0.44862385321100917, + "acc_stderr": 0.008698767182005266 + }, + "arc_easy": { + "acc": 0.4734848484848485, + "acc_stderr": 0.010245347015573716, + "acc_norm": 0.4612794612794613, + "acc_norm_stderr": 0.010228972678389592 + }, + "arc_challenge": { + "acc": 0.23890784982935154, + "acc_stderr": 0.012461071376316621, + "acc_norm": 0.26791808873720135, + "acc_norm_stderr": 0.01294203019513642 + }, + "sciq": { + "acc": 0.742, + "acc_stderr": 0.013842963108656603, + "acc_norm": 0.718, + "acc_norm_stderr": 0.014236526215291333 + }, + "piqa": { + "acc": 0.6806311207834603, + "acc_stderr": 0.010877964076613731, + "acc_norm": 0.6844396082698585, + "acc_norm_stderr": 0.010843119201758936 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b1b9c4seed3/evaluation/rankeval/4b284b1b9c4seed3_5.csv b/4b284b1b9c4seed3/evaluation/rankeval/4b284b1b9c4seed3_5.csv new file mode 100644 index 0000000000000000000000000000000000000000..0140e8d0dfdcb4a5c8865e7ba4ca428d1ab772f7 --- /dev/null +++ b/4b284b1b9c4seed3/evaluation/rankeval/4b284b1b9c4seed3_5.csv @@ -0,0 +1,21 @@ +task,metric,value,err,version +anli_r1,acc,0.333,0.01491084616422986,0 +anli_r2,acc,0.346,0.015050266127564448,0 +anli_r3,acc,0.34833333333333333,0.013759437498874075,0 +arc_challenge,acc,0.24573378839590443,0.012581033453730114,0 +arc_challenge,acc_norm,0.2645051194539249,0.01288927294931337,0 +arc_easy,acc,0.4823232323232323,0.01025336980569896,0 +arc_easy,acc_norm,0.4553872053872054,0.010218861787618725,0 +boolq,acc,0.4434250764525994,0.008688893661318225,1 +cb,acc,0.44642857142857145,0.06703189227942397,1 +cb,f1,0.39049382716049386,,1 +copa,acc,0.62,0.04878317312145633,0 +hellaswag,acc,0.3990240987851026,0.004886969266944277,0 +hellaswag,acc_norm,0.4933280223063135,0.004989337148572078,0 +piqa,acc,0.6817192600652884,0.010868093932082235,0 +piqa,acc_norm,0.6817192600652884,0.010868093932082231,0 +rte,acc,0.5342960288808665,0.030025579819366422,0 +sciq,acc,0.743,0.013825416526895026,0 +sciq,acc_norm,0.716,0.01426700906103131,0 +storycloze_2016,acc,0.6493853554249065,0.011034317290463294,0 +winogrande,acc,0.505130228887135,0.014051745961790516,0 diff --git a/4b284b1b9c4seed3/evaluation/rankeval/4b284b1b9c4seed3_5.json b/4b284b1b9c4seed3/evaluation/rankeval/4b284b1b9c4seed3_5.json new file mode 100644 index 0000000000000000000000000000000000000000..888ef70013f1f54d4f9abdae298211df4c17b705 --- /dev/null +++ b/4b284b1b9c4seed3/evaluation/rankeval/4b284b1b9c4seed3_5.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.333, + "acc_stderr": 0.01491084616422986 + }, + "anli_r2": { + "acc": 0.346, + "acc_stderr": 0.015050266127564448 + }, + "anli_r3": { + "acc": 0.34833333333333333, + "acc_stderr": 0.013759437498874075 + }, + "cb": { + "acc": 0.44642857142857145, + "acc_stderr": 0.06703189227942397, + "f1": 0.39049382716049386 + }, + "copa": { + "acc": 0.62, + "acc_stderr": 0.04878317312145633 + }, + "hellaswag": { + "acc": 0.3990240987851026, + "acc_stderr": 0.004886969266944277, + "acc_norm": 0.4933280223063135, + "acc_norm_stderr": 0.004989337148572078 + }, + "rte": { + "acc": 0.5342960288808665, + "acc_stderr": 0.030025579819366422 + }, + "winogrande": { + "acc": 0.505130228887135, + "acc_stderr": 0.014051745961790516 + }, + "storycloze_2016": { + "acc": 0.6493853554249065, + "acc_stderr": 0.011034317290463294 + }, + "boolq": { + "acc": 0.4434250764525994, + "acc_stderr": 0.008688893661318225 + }, + "arc_easy": { + "acc": 0.4823232323232323, + "acc_stderr": 0.01025336980569896, + "acc_norm": 0.4553872053872054, + "acc_norm_stderr": 0.010218861787618725 + }, + "arc_challenge": { + "acc": 0.24573378839590443, + "acc_stderr": 0.012581033453730114, + "acc_norm": 0.2645051194539249, + "acc_norm_stderr": 0.01288927294931337 + }, + "sciq": { + "acc": 0.743, + "acc_stderr": 0.013825416526895026, + "acc_norm": 0.716, + "acc_norm_stderr": 0.01426700906103131 + }, + "piqa": { + "acc": 0.6817192600652884, + "acc_stderr": 0.010868093932082235, + "acc_norm": 0.6817192600652884, + "acc_norm_stderr": 0.010868093932082231 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dbb1f7c579711c026a80dfec71c8a7e7ea011b02 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5a830d5087849aaa054ce41f4d716a8f60c0c1ad5f931cd55571e204a3165f50 +size 199058647 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_0_mp_rank_01_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_0_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2aabdc7a173eee308f471eb96300a8add6e90b94 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_0_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a0a8f4d5483a062f098296a288409e20cef1b941b3f363877f7a797d31f3981c +size 199058647 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3f421fe9a78a01a0a8986306c2332fdf82a77650 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:31bbb354ed4dec951ce4a64ff0b7f767ffe4df7e9d9443c2cb2cab71ca1268ab +size 199058733 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_100_mp_rank_01_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_100_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5effb3624f829ea4f7992eaabb4a3371521686fc --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_100_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:26c228799a3bf67a1e59b4b42d82aeddfa1a4ebd40cc0896101e0c62c598b3e2 +size 199058733 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e45a5ee5af9d6824dcb017352b27772aa118e55c --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:181220104ad55f0a2fbae6a8c5b1d4cefa7c5f6cf3e25a118810f95776eb120c +size 199058797 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_101_mp_rank_01_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_101_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fcd7562207e03f1e47c3573dee2182a1b7eb1b97 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_101_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5008278b444db0047628f3292e5c109542ba312218e2edcf8c770051c4b7f1b2 +size 199058797 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..23f2127ce0b3cef226b4922b936059498196f6b5 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2fb9acacfce43877f29caff78c05871b6fd94b37a271783824ff68afe4d2f4bf +size 199058733 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_102_mp_rank_01_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_102_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f585a33793ace6182b69036c33f663042ab25adc --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_102_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:99be8f35f2bf4af38ef4681c5f09aecf0977d5811c1ea3f0ae972f11cd993d29 +size 199058733 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..97120f7be60e925434485310e26c7aea9f2530c8 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1eba1fe7d94ba26ae958b1693f38bb3e9153f841c40404b1465fc5d90e2300d0 +size 199058733 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_103_mp_rank_01_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_103_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..33722af12e1f0dce36473070b174a4eb678ce97f --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_103_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d725244510335ff939fbd7ec93c22d1de60136e5504cf8f6d04e4096e0937910 +size 199058733 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c6d890342910bbcf301e7d0b6b501f524a561d43 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:96948e6832038174de9dc4a86bbb4c7b9619c8309d866463967e6fcdabcbdfaf +size 199058797 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_104_mp_rank_01_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_104_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0aacc3c66125f69db198f76b2f7e3f35d3c7f08c --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_104_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e92bd50720286c3f2699705820e089543fd801f32f16eaaab65d5550fd489b2 +size 199058797 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bd575d0b8379ca74b5566a7c49cd01e5ef3230aa --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c167ccf848fa691a2d70e23cba4e7f702a2f51662392afd48439a381c98bac1 +size 199058733 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_105_mp_rank_01_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_105_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..95c7b0761e142a81d960039e9451783b99fdf4f0 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_105_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:233dcac969c729a25c79c5a4ab917b8ba9b41ffdf6f75f070bd82dacc93ec110 +size 199058733 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7246471ddb59ecc72496e847fa0adfac8eee57e6 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:264d7d0d1b6d4dae05c1f877d858d6901e1a401dfcd232eef81de436bc53138d +size 199058669 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_106_mp_rank_01_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_106_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c87df1c8d5027204108bc106980796c2c0b15292 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_106_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea76d3040c2e9c5a7432c415392ccbe8e816498f766c40d2156152761ada0470 +size 199058669 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2a750561ccf1ba05245114c74b4596afb1e1214e --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6e0408ecc074118f0c36bbad96e1e6fa3c20f105f8d425d99e4cf79e21dbcb11 +size 199058797 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_107_mp_rank_01_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_107_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..668cb3c343aefd7ddde2f46e1c362395f6ca2df7 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_107_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:803f5d79f5199cfa2c48a8e7e704f90fb429c9313a7b976b6865e571558210e1 +size 199058797 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8dd8aa4809bf95a48eef5d2e7853419d71725ac2 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e3d62ceffe0ec18a828afcc1536ac475bb23b323f8e8fa8dc7934b118c612cf +size 199058733 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_108_mp_rank_01_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_108_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..59ee5849415de2e9c31f7f940abbd9f7cd43c3c3 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_108_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d20e9795034f439e76e2768af6868e9380228aa9417ac8df7aad49045e7ad97f +size 199058733 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7eab08f902ef40f4fd35583152b359b9cdea6bab --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a64c4e1811c6bff210903a981904f63e7fb756602425a408af333454d27a819f +size 199058733 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_109_mp_rank_01_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_109_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..67d549af8f3ddb52bceeabf76709c136602e6d01 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_109_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1e401dac823d7975f32b84498fd2df66ebe5804324ec6e5f6def96ef7886f0ba +size 199058733 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..195e5227faa2def1cad28d1484075bd37f10fce0 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c1a5ed61fb1e74908038504fd698d16ab9bb71f5f0e7ac33b49b001054d22ff9 +size 199058658 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_10_mp_rank_01_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_10_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d7246041e5eaea690e1c1c5f9cc15d63a714b5d2 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_10_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:891853988c7cee1c24dd557e6685c7a217e28eac9985de1ab9d0e4b66bcee319 +size 199058658 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..464d591472f32b10bb0ce054684504f9fce6f258 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d245a3492df77fe89c1a93c289e511b8a1a34e4a5293958ffca34cdd9792bb4 +size 199058733 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_110_mp_rank_01_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_110_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cd33905341514078445d30fdd62265e861b3028e --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_110_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a161b01eff5a5279739779ceb06103816ff8bc88f8e7e14c3ba309fe54516128 +size 199058733 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7d14205a916861ee8c83c7f5ace52febfdd5c9f6 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c605c4afdea3d11ac446d1bb23e9fa58a3d7e45267b06554615234c82f2957aa +size 199058797 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_111_mp_rank_01_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_111_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f20ce2e00404970b6bf0b3667690bb0f90355fd8 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_111_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d552786a718f1576f3d5ce25dc513b9daadc738aecc574084c6603442f1028b7 +size 199058797 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cb48b59e2a6f0491b06cb4a1f04c9b87f2c6cc92 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6d5fae29a948eb27c556d04cc1032740cd11e1dc3dea02eedc3f6eae51ef16c6 +size 199058605 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_112_mp_rank_01_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_112_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ae387aae0211aea7266e51597ed5f349ebc130ce --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_112_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6c0a73142c5b8f232e2fa5ae1f156e85e32683ff95e4b68cbb4f0b0e4692617d +size 199058605 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2d2cd0768ee987f4f1347acbc990b2919dad8b02 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f46fd047a3682bf2a6eb131bb0b63e9901152077d89542b4fe055a049dbc7d1b +size 199058669 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_113_mp_rank_01_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_113_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4bedf32f1211cec8790fede88c082da78a7b9937 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_113_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8f38a03efafe286ec65ced4cf2efa5345d81bd3c8b05569f727a80d0f748f810 +size 199058669 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..04ab67f57aa56ed9bd9a5b999cc74488322442a1 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b428106ffbf5d959e7e7f8a3923e489bac9ee1cd17af6c7922ece3e641d3f251 +size 199058797 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_114_mp_rank_01_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_114_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..adfa7eb89d5eb3190fbfd5021fce49748f4eb8ff --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_114_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:34f7662c5ac220771b3d62594c380d0298651115e4e41f4b1956dd1b9b1d3997 +size 199058797 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..22d56722db3039495d7fb6c3913663afd237c384 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8fb7db4c3bf1bc370d327294d5478e782c8ae07ca4d96ed214ba195f49e6f5c2 +size 199058733 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_115_mp_rank_01_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_115_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..110e7384a1a8544711dd11b1b477591cbfafa355 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_115_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:be0feab437ea7f396301f520918ce23ddc17e059b2cf22b912f963cd5c3ddeb2 +size 199058733 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..37ec2377fa13ddb5cbca5a8a76880bb7e54082e7 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6cc9bb67e241f6cf18a8d2bb267952f5871e193b186071e4fe01a880abc9316e +size 199058733 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_116_mp_rank_01_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_116_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8e2053aca4c8f736679791079d5f78577e30991a --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_116_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1d4d84af413581d3302c3648213ab2d9d476368d0d4312746175dba945b8fa20 +size 199058733 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ace3e12f0db103c397713c995937afedbd317d70 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b716f96b15dd7d6ec092b3c8f5c24076b5f1b9c10ffe0a2d6c01aa7bc24f7e83 +size 199058733 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_117_mp_rank_01_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_117_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6ca047ecd540eef6c87448dea240018c73f818a5 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_117_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1b46ce8cae9e884e2596ac27da30fb996d4497b7f4b5d4bd13e5dd81101d5d72 +size 199058733 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e22192f5b19189c3d0150fd912ed2435a5259296 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3ae8e9df4abf2871b82fcfca8d9263dc5415fa0ee5c281a6bf0c3918d9aec2ee +size 199058797 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_118_mp_rank_01_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_118_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a342e947664a0fb4204344270e3bd6c7d551cbf7 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_118_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:34a244363a75def16e4a2d2d998389d80abbe1c8f71ecb4d63565b735be87593 +size 199058797 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..654d95d067b34cca814bf083bc512a8335e30fd8 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0326c2b95dcf61ac384901f055281191fb49d01609c5425fed71178301f260fe +size 199058669 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_119_mp_rank_01_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_119_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7aaeed0d7b069060e05cdea32acd70f892523918 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_119_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c0d641767b89fb3321bb45bc768829f118e01a01ddac32b450d34c21aa003cf7 +size 199058669 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..58a92e88c64e90612f7808f934621ff8e98722fa --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1326df536b4f7a9d553011d0bd2b8799c9e93760f3179c49bc89b7790153c759 +size 199058850 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_11_mp_rank_01_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_11_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7c30677756d88eea16da747da883fb7722552ee0 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_11_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f05a69fd833c413ab906eab3c4e79d29987b11d1c25e93e502a75e70496655ab +size 199058850 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7b62f067ed5349a46c1fb47abf3d261ed4929355 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3f9f59d13f09b61017d5d75f69a515b65110a26561d0b9eab55fc85ce57c2302 +size 199058669 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_120_mp_rank_01_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_120_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..79acfca0b2eec70e5614cdf526f637042db8d618 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_120_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fcf8639cab863a089b12a4eea53687ad435b29c3e923f699f5d20ab8da8c3e75 +size 199058669 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e15b800d57d9d872b2e040d1bcb8ce9aec0ac41a --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7098a06e7f53d9f646db13f57a9fd27fe1c2cdd9c946e7f9f0e66cb8196f1ab9 +size 199058797 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_121_mp_rank_01_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_121_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..697a3d19566c691c56ea928dba42406cba077ff6 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_121_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:66959b19bcac39cb5d6e6a3052b9d7637c68e6487122dec652d96c769eb3566a +size 199058797 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..13f6965c38ecdab4e264228c392abc19c402b761 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:794d3f45d9faefccdf87c85f9de7b7fd0f3873e333aaa4458bd4d54585113c4c +size 199058733 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_122_mp_rank_01_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_122_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..beef8a8849ad2501c9ab93a3a9bffc1d1046102b --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_122_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:43e4aff639daa839940b722a7e7a4ea7624c59c27b177ba3ce3e939b97056cb5 +size 199058733 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2a597c5f861087f42d9d8ba303af159ad4442cf5 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:45881dbd48726a0488ed97c109f5c37c8cbde94740076ba9250f8bc7113e4429 +size 199058733 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_123_mp_rank_01_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_123_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..62c420f53775d50619d8c939b3ccf22e93548b8a --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_123_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4ced593c97f147a28ada8af4314e6a5b4aa0c22de26bbb9dd89ae99eb23c126c +size 199058733 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d53e50331cd02e7d5209cf81100ff8f1efdf48b4 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9669ec08834cbca4d1efe8f146d3c75ea09e0f3a35bd521bc2e68add5c494fe7 +size 199058669 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_124_mp_rank_01_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_124_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8cdf3f40fdc4079bec70416a23c23342b02c0097 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_124_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e4190fd837acf4cc5079221aeece9c1b6d271764a794d00f2c0416c3fb4115bc +size 199058669 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fe704a446143bf114276f6ac7846e6aa4a949950 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c0ede9c96f84a979878c5956ccc268074d7fa62a471b6298fdb8176f0dd687fa +size 199058925 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_125_mp_rank_01_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_125_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..92a874bad257253abc78040dd8e1aa518f1e065e --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_125_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e5d730ffe5718e3cbde189c59d693a4497eb25a9e0e6445223914d0436151b2e +size 199058925 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1f6b49bed7cd66d600b6666d0fe49712b2146fab --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fc46c13496fa4cc3fd86c419a6e3dff8a9d8aa267cb1a897de547aab4d4a1bc9 +size 199058605 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_126_mp_rank_01_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_126_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d81ca700c48001758a0aad6e9bb1110ebe24d4b8 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_126_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d2974648fa3e52b9c432b4b2c21ac7bfd4257ba3601c875dc550eb760fa9360e +size 199058605 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..43ae92b1c91209f5b6417296c9beb34c56aa5e9a --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d22b9a4e4b30d9725c3b96a9b2d53e38239db8111c16049e0e19f6b3bd624fe0 +size 199058605 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_127_mp_rank_01_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_127_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b552e8553c8bb0bac990f822e20f4e88d511efe0 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_127_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:603dde9dd459aef6735656bb6ad83af77a6498f725aa719339cd75a927a823fd +size 199058605 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dac0ba6618ac0055645af2ca60559645ddea7f82 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d9c4af1778c8c7d1795c178beb7becc5399bd772006f92c0b44cef7562640dd1 +size 199058722 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_12_mp_rank_01_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_12_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1d5b3c1497062c00dbcf6c413f3ac97608654d29 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_12_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7759e3c45973634e4484c338c9a75d6537108b3db30149a4a1a4b2a8e125a199 +size 199058722 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..99bc64dc84dcd3d8a20164dd5cd1b4aaf6a8d20c --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0b0295d1c28a1249626d1ca4468873491ebeae9e214bb0c9edc6ce56f048477b +size 199058658 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_13_mp_rank_01_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_13_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..95e86067a50b836e56527fe2d529283eb99c59fa --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_13_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4bc5e4968122ea40aeee0f569363a54900bddf7c2b7d5b0c878139d8b4bb94ef +size 199058658 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..56449cbf570cf0f614e1f859fdcf68702e2a20b8 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:96081ac869d3c1bdcc99646abf66bf01f2edfbb17060bbbbe356dccc0cb12f34 +size 199058722 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_14_mp_rank_01_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_14_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f387d06b8f85fc96f55a6d876c1997554575b643 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_14_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:94b545b4eba31c8f1cd6e1c61ad9a3668b27d0a32307729b9210bcea15f8b721 +size 199058722 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a082fd1a2efa377ecd72411938808d87eab77670 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7417f9372a63b6c94e4202a4709086fbbf6c0262ac42e7c485d34a116fbf12c6 +size 199058658 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_15_mp_rank_01_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_15_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c51fd1f14e40a83fbb1a6b6474d0a4b355e2d53a --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_15_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:61acb1fd39e499bd0b47d95c454322fca4083a2d9a7473651ace8f2980250c8e +size 199058658 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..075b69a6840da1425fa308d3f9adf9318088c5c6 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0a60eef93f66e5c2a40bb52842c56151eb5b29dc85a0a06c0f0719858a684896 +size 199058786 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_16_mp_rank_01_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_16_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..159d3fd6973e8515c043fd789130f000f387e143 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_16_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0d729caa157331f053b92c9ad418b2ebac11662801b12f47e4e6f1b02dadb2a6 +size 199058786 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..198b6403cc5b2b25141216f819959452d7ff64df --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:01ecc5f03f3f73f594b5ba15cb1f3842dab2e8fd3b45cd0ea461b254e6c45494 +size 199058658 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_17_mp_rank_01_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_17_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..265a33d1a5ecac020861bbc487e25ef124e2a093 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_17_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:146e3508eb953ddb194956ef3a1b5da48a6b0a0323c3c396ae93bced1525aa4e +size 199058658 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7ec624087d34bcc09bfbe4b3da9c6724bc03b860 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d3445d568c6ee16d1d5364516b588f54d1b6644f2de58895aa29045b5055d71a +size 199058978 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_18_mp_rank_01_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_18_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7d989caed1a7ee62edd1f2c9df9b2fd28daab535 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_18_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2e585e5723ef232b1df9313cfd1f873b31a93c71fe2240cb0fd2cbfb4a36af60 +size 199058978 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..116db7b1bc7485ab08954e70ce618673f2cc3169 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5141012220a0cfe3d87f95cc4061993ae53f2774cd298bbaf88edfdd4300ed91 +size 199058658 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_19_mp_rank_01_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_19_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ec69444f7d8a16e1ba999ccbd117dc29ddf2e7e9 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_19_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d6c3d2db120ad9c97fe489887cecea13bbee7ae1f95f9b2ad5e8d6fbce206f4a +size 199058658 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5ab574cc8667425bf1cfb6168e6d91f52da3efe2 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:916c4cd8343a44764774bdc203e5545757275a1b245f80d136090091c94a9070 +size 199058647 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_1_mp_rank_01_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_1_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c58001392deae724824b274dce8b181e38064b18 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_1_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:043bbeb1d7aa5a69032bf342cb77ddaedb6e26c712bbd4f9d27c49e846b160ab +size 199058647 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..86549c5519742b936070fe8564e800c988eb55f7 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2817217a3589abc6b9567e22311831a1df40d8ea9bacb433aeae13aa2f8e58e7 +size 199058658 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_20_mp_rank_01_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_20_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8b518932463cdf677ee07b610d7a3a779f0480fa --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_20_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:de34c31f88485315587e827651b3c8243661db13409ba60d5c531461d0e426ba +size 199058658 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e7d45b4fb16b0efcf697983bbc7963a6e7568daa --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e666f3d866a589354df0804cd22dde976b31497d9fd70131e601ba65f515a13 +size 199058722 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_21_mp_rank_01_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_21_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b67e0b4fcba5cd739f3010e77a3d02e7719cf687 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_21_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c8bbff2f042fa13ca8cf81c9fb2d488f2fffe021d0ab26d2be288f0ec17c9b8a +size 199058722 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7cebe8757ebe10c9403cd2f8db918c4a627b15e1 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c1ca07cf334b82d115e3696c18afb1ff399ced51dbb424d32b8088f12cb2e5d +size 199058658 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_22_mp_rank_01_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_22_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3350df4f7934f729e6fef276f8c7d922a3aabc2b --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_22_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7722866cda289c356f13785a0f708c62d05068d43fbc5f8882b3d4769feec65a +size 199058658 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..32448e62491daf89e7843263b2e608612ac8bd35 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e46fd0024bd3aef808fe4c99de1045eaf9a82d75281de3d4a75947efabfdf7ec +size 199058786 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_23_mp_rank_01_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_23_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7a3d8f12dcf9e590ca7d2e862cb1d1cf49a5e67e --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_23_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:83c9efa8799d62016ec57dc69b27cf4d876724deb8e4af88d2a8f8c8f8706c2d +size 199058786 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3516e9312df5488cb6cb58e5bfccfc33576ac5f7 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:06d5c5b70f5d06f5fecfa41d7cdae3830569cbbf90ae9958e73b2594bc80a8e5 +size 199058722 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_24_mp_rank_01_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_24_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cc4eecda2a2271ed891877fc7b24d15cbf54c76a --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_24_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:261ad5167d88d45c47285540977c853f7aaad06fa9689db730f1b1224b8556c2 +size 199058722 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..af79ce9f3d317bfa33e35eb436418e773262f9ec --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:019f3ab71c63d882e22f207ebffefe4f37da9ecb6e90837e1cb7461d7b450d67 +size 199058850 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_25_mp_rank_01_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_25_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..21a80b1bbfc66c2af8b11f244d279713632e8ce7 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_25_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0a2a39d73d8ec556e08b30ca464ed73a677974ac187120f6ef4fe3304bda290a +size 199058850 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..24069c3c19d91d305f57c8a288802c5528d65227 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:45efa951a10ed72aa97aa5bd2a5641ec763812fa82c34edb3e09d6e5185fc5bb +size 199058722 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_26_mp_rank_01_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_26_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3b1656476e7b51826fd8b1cd8f1b039714b99e19 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_26_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6ff08f3878523efdb0d3435401562d38a8f715b01cc6a0694e8a1f18720f8f1e +size 199058722 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dc53f699a779f86d9ae8614896f1261d0fd01632 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:248c4a0704e8dcf0658e759dfa082f39a95a0bc586d39ff571403b74d332b681 +size 199058722 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_27_mp_rank_01_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_27_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d2ba51141c5e52f2a7c3f968505a4feeb4022cdf --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_27_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a323524892ea7fc2ffde74bcc4aa61467b0c7a324a6e3d463c225b099a4bfed4 +size 199058722 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0bd0fecb99bb5809cddc6fe5d1d1e5c3eb7830ee --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c88c3a1c74a3f10ce9c0963886cea5d1a4dc7dd315e293688403a2df4f60e5e +size 199058594 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_28_mp_rank_01_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_28_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..87f26240d8e96e743bc65914ea80da2b59392ccc --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_28_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:718b8787f42fdde896cce339debeb31c451bd5c3cd30fdc6116415b63320a58a +size 199058594 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a458576907a21984bcad08a70661d58095bd8cd4 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7766a27ffec97896f72e416a374d4fd9f6f86016b8949cd359c938fe719cc833 +size 199058786 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_29_mp_rank_01_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_29_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..847e45aff8a8dd8a2ffceff148a0a047e0a118ff --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_29_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da366d2cca3c7710cd5fddbaf7cf5fa1a5c4a02cfa2cabee6b3299d891208af7 +size 199058786 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3e5eadfce6ca3b0d107091b7e9d5525d0cc60730 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0ec56e3a9cdbcfbed33ba7d68c548d15bdbb92b7f23bbc6f0fb52f07202e2a53 +size 199058711 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_2_mp_rank_01_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_2_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..efec936ae6420275faf5a6e26d72f32b869479b5 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_2_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d3999a4a14fce0442a65fd0984bb10ade16d7162c01d6846c18552b416d750f4 +size 199058711 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1cfb3a569a6d839f061309f15ee2165ed07ee93b --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5fd77adef1c6f44e938c445d80ed9664182bab6338a467699b39bd953ce89881 +size 199058722 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_30_mp_rank_01_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_30_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..eda5995af7b4370732f3d567a8c627179255b7b6 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_30_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e643d4d2007064745be49c9a4f393967518bbd0d61c226563e480bf2d76e8ecd +size 199058722 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..575c05b80f6510f4fb53b9b505738255a7d1bc98 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e40e566436dcef98c3b49aee893673ea387c78a8166321de31e2af2d99c8824 +size 199058722 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_31_mp_rank_01_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_31_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8876e510f69adef5d4827dcda67fd05f504fb3e5 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_31_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d2eac488df39cc75b9a9b66c2ebb2ed480a7b83f9832a2512048a0252f4f4ca7 +size 199058722 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7be4c624e77c0c505ce77c2e70ffb084b371db21 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:327b576f3fffe78a5853050cf1e5d9d0ebefed4d865d72e8ccbddae6916d1b06 +size 199058722 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_32_mp_rank_01_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_32_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..75ff183c2d4658c1a26d4ed81253ec873696fde5 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_32_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b080c064104a7127ff521fa0307cea7a98a152649a364f11df8d29e010d7cf7d +size 199058722 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..780e1e5590771e49b633df73aa9a102b68a5ce85 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e0beb349fe2798c348f56d33bee1792cb37dfc9c7bba050ca4abb2fe8027b90 +size 199058722 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_33_mp_rank_01_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_33_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..39167de05897c0d182a2ede0d9b6748484e8067a --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_33_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d85fae9c754edfe7c1f6856cb08c44f972cd0f3ca69b84dfe2addbf74253e8a1 +size 199058722 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a91f82e614f7b243be51061595c3dc9308f8cc70 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:73233eccce759a3c14989fcc47b98ff0355d20872f6795b6d021fb6d7e48a17d +size 199058722 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_34_mp_rank_01_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_34_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f76b7a9fcc8a5e6baf3624ecd652c5f26e3bc711 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_34_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6e728523e7cd06fd176c43a70ca0b243dd14e0264912ce1d24327996a16ad3b5 +size 199058722 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8bd64e2c0bdc39e38382bef3a19d1a55e4a84cf9 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0e5d8498c58a4f4988593a6a4d7cb0f02c27a9f8a48d9d63a271071725329478 +size 199058594 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_35_mp_rank_01_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_35_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8b52225cee1c2a1d92da0e65d7df364402c9abea --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_35_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bee52161fc6344e8008e21eebf85ed1054a69bf30fab638bf2c4a538bf8bf618 +size 199058594 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e22743e32dbd9229dd8afd43fd2fb12f49d75fc7 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:79b3b487cad6b47ea9965846f51c3975f8b5986e66eb70d1676ada3985e5bd87 +size 199058722 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_36_mp_rank_01_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_36_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fa7c25560d8d2304516f0a518f927817c87ae2ed --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_36_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dddb8cc03b8e53e450a9c7113b4ccfa6974fcc4bee36af5f59ff7004c69d9229 +size 199058722 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..46ca40bdf1d533113a08269ddfeae365ddde8d62 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b88703b9cd19bac26de810052e3f8fa349cd904205b6d67bfb46303c013be6f8 +size 199058786 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_37_mp_rank_01_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_37_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a1b2d799873432369c6dee8d7749e1f35a973fdb --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_37_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:21c49c881287dd48d644e0dd2c1407b58595843ed72641d2b7892abbe691f5ab +size 199058786 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..004914193741a6e5b5f50cc0d14545aec974b052 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:345ff4fb07b275314139b6ecd9b05ac7f7da73ed05742686b6831a72dfa55f96 +size 199058850 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_38_mp_rank_01_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_38_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..44e8396fd7591fbd46ed9465c99f827b84f3e4d0 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_38_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:73e2288cb1b63de523c4033e33db697c5adc7255b808c7f9b1ee0c2a22345c78 +size 199058850 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..12db7a819f95707b36c523b7beb604ffe490b025 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0fd897da6079c3b29326c543341613ef1c8b33d12583cb869951ca6d81f47070 +size 199058658 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_39_mp_rank_01_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_39_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1d4625f3c70dcdd72e7135add46c8d687c9dd4f6 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_39_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b59e044b1cce56f68e9a98333d8dd5e8bf7bdc0a773cb4ebcea27ea7677cacf8 +size 199058658 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a587ad625f0aa53e84350a6b112c862ac27e4e20 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:30f8ae1d6310b5b87d3bfe344838baba623f5a74ee8395981987d6d0f6deaf0b +size 199058647 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_3_mp_rank_01_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_3_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5bd029d86ffcd1702504abf28b6773008b11a143 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_3_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1143bfa3ae5a13b4a6de2b96195851f109b22d878655025d1f10cc6cd6f97efd +size 199058647 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e47858c6b510ccbfabeb2f120f20cc99b37bbdba --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d6cb77288b58bd9f5d5e7d6d69fba6414c334413bb180704ace36d915b91e1b0 +size 199058722 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_40_mp_rank_01_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_40_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f00d5e8fd4c5b128312bafd560aef750666211a2 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_40_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:afa78fd6295402ca7985a7f723ed55cd57749cabffeedd30e2f143b719764efe +size 199058722 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..576488465d0c6e8f9b46370fb6fc3e217dd74b2d --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f0e5785fd2b4b1466e40b2772a86d09ad47cad51edc3a2d3e97262ee3341a915 +size 199058658 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_41_mp_rank_01_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_41_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..558149728978c214a22cec8d815e75d95ae76468 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_41_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d1f6860c251d286dbe6c37173e46ac6e08bcaf496e5adfbcb2097520cb267c91 +size 199058658 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ee65639d56f75a2132491c77e27520a8fe9a9e7c --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9270aa125069a295349a7edebecdcbd787533b320abc0446f44040eb3b68da3f +size 199058658 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_42_mp_rank_01_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_42_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4e4ce2d1d331c0892a606122744a20dc2a61986f --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_42_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0b959a16d0a5c4ffbee85bec30af041ab215040cfc55b330fa118d590e3ce8fa +size 199058658 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2f32fb382a93cbab6f4aa897303587e672acc708 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:564543ba2bd6115bceb7ba4520fc5f46b763ae6be7666ccd22e4ca5dec4fd4c7 +size 199058722 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_43_mp_rank_01_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_43_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cf6f8d2448bf79f068f7e349149dda93824b466f --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_43_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b58681e1ba8f6ece1917b3c9bf6508faa732cf9b6f4a6f578b51e1ee5373f53 +size 199058722 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1100db7a01c914aecfa3ef5b605136d460730fa5 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d2557eec478e9a4cf142afefe5edd6d40a20d9afac489fdcdd4a196e8d23448c +size 199058850 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_44_mp_rank_01_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_44_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5c3883491de180641f6a1d6e9635b09db3c762f2 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_44_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:201ac210e521e915089bcb80f9285c03384d62b8630ad74d65815cadb094c70a +size 199058850 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..73f2554dd9a526c5efc44d2e691cf56e44c4e63f --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6f36e8ac073d1814797d77f4e2a4f2ed6cd28a75e1667de4db8650e6ac5ba737 +size 199058722 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_45_mp_rank_01_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_45_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..876188477188691a9518f8d9845b355e0995d3d2 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_45_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eb041e717967ae4d87052570ad214c0b656bb287edc0245e07090c1093b40865 +size 199058722 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1b77f2ca862678e8ed6dcc5e934dc8004f9393ea --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6cdfc3092de817c87b9665fd7db7269f472aeea37fbed899f39bdd881a62c236 +size 199058658 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_46_mp_rank_01_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_46_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..12d03a7fe1187e2266f6187ad4a5108105ae9774 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_46_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:804a86261aa796b3ea2df24d67bfa1e06b847a964ece834d21d3afe552993856 +size 199058658 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f416e7e28fa7d385bb9a21812a6f58063199b4a9 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:95e70a315312f351f5b3624c6dd4461b0bb0ab68f56e937a06817a647294abf9 +size 199058722 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_47_mp_rank_01_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_47_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..334b09450798b3d98f6b024a48f526623d2d35c3 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_47_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:659057758a12ebe3b61e095eb95ff6cabeaa5ff5bb21b40e9760106e7ac3d4df +size 199058722 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..76dac5ccf92e5566bf0c8478fc60ed3b3ea26319 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f350fed985e250b91a448d8dfcc3f7d09a42de9bc7a33f7521132978b0718056 +size 199058658 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_48_mp_rank_01_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_48_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..582af76412c1f6b05afa4977e8bc2922d995497c --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_48_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e081d524acacee536572fc2d0129107aa7712586e84650c4e31b11a45c17620d +size 199058658 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..99d6861949e9929e8c463f53b0b3c4b90235d1f5 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:98357c75bb007b26d4acca0cd11742433038d6872798fd832d3e8eafb8d639f7 +size 199058658 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_49_mp_rank_01_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_49_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..19d3d080789c707617f3a60044b0093a5e456ad0 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_49_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:75177188ced4720fbb0198bfcbfd9c0f0862dca222753826602824132d132b01 +size 199058658 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ca7ce6ec1f5941edaf4ef6e2d4483e4c3a99211a --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7933cb5ba0565877184f1f1d4f65d6a6c100e16a929524ef1f7b3e2f0e04d2e5 +size 199058775 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_4_mp_rank_01_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_4_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8b1ef7880a8418f3f925877cfd11834fb810b20d --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_4_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a14604be34858e58935af5118adc6ebcfae0f2f60348fa10b344bbef2e987b37 +size 199058775 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ccf91f6516b85c16bbb010c85a83935afba7b0e7 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:07c16f51e91066f74adeb9f94a306826cbb9511a79365fd6ac155d621402b93a +size 199058722 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_50_mp_rank_01_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_50_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2a05f07af75889786cc844d95908ea2eb21457f6 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_50_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6604a2b6e31f0174cb2180c84d7b803c10b05a9bdd403a9ae5bd82e97a379ca8 +size 199058722 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8eca936bfb3537ba3e89b5c5585731b68af056b9 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fb1f245e4fc794dfdb5e555a4e4a36798a9ae828dcaae014835de5a153ff5f88 +size 199058850 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_51_mp_rank_01_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_51_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8da31278f113ea68894781944b82d8c496add81a --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_51_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:565fa9d1dfba398794f045111efead360d5cef1b2eb7dac425ef6b0110011a90 +size 199058850 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..48681e8447d24b94f20a48b72107e874c8c6ae2c --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aa54b86f26c6d5f38aad6c785993a2b32936808ab7affd86b11f2a7236b544cc +size 199058722 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_52_mp_rank_01_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_52_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..896548dfc6b8c0d4377cd9de9d62514cf759334f --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_52_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f54e1428595db1df683eb69c77846f19ba6efb67c6c56060f68edbe26631d6b5 +size 199058722 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8865563471b749e4fc3b7d7753992735e67a472d --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:95fe8688f0e649c8fc73095699056faf5a50501eab36ae38a032120d8098c162 +size 199058722 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_53_mp_rank_01_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_53_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..20203d14031c128c835fbad84678896eae85c28d --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_53_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:40fc814594fa54c90e2a4f15cd2ea4062763cbb35d5466bcb4bcd2d5e07a3c0b +size 199058722 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..25946a59ee906a0e73eb44e24bb8841aed845176 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5944b32b8878bae21eba32d80fbcdef369f460f14bd42bcf3a68f0d142ed20f2 +size 199058722 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_54_mp_rank_01_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_54_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..90ff0beea38fca65f4d2531b972dcf0d71f70872 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_54_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:284fe66b2c86b2508613207edd5d8e50fb08c6bde95a10b175721ebab7711fbd +size 199058722 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b784fdbbb11989dba350f4d633012a46f728bf1a --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8cac74a60450c437535ab44ac141e6257bd62b6c5ca428559738ba0ea647779b +size 199058658 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_55_mp_rank_01_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_55_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d15dc12857c8110cd17610b588f003a51bbd60a1 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_55_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6d6b8ce892000eb22b5a627210b11d87e265de2f111455710452c508bed68df0 +size 199058658 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9c881d3b3a27d648d880ed06817e0bf64dacc73f --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9ab2ac3a81269ea30d23b8d163428243fae9e55d641b39e9580f598462710138 +size 199058722 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_56_mp_rank_01_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_56_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6a932f5b7d35904b7f79ace666742ad874f56e2c --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_56_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f785a403677eb50539fe3199e6b0a0b8c1d16e3765b491597c233958e75ca6eb +size 199058722 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d430c0f1303b7db4ac163830476bf91cffae155b --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6803db9dc8e95c2a4825641c4e5a5a092867fa2bf219b4cb92b1dda0810f9443 +size 199058658 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_57_mp_rank_01_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_57_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e9c7de0a00cdd4c5e9f53ca95506d96653372408 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_57_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:85d05dfc55a85d8d19640b4d4fc76b5172ed172e1dea135999e5745d46d3523a +size 199058658 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..06ae4940c8d4cf70a006c6f109edd01a00810873 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c08acd3940de6f044d2df0cee492b22305110e56719e97058638e46560297ac5 +size 199058914 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_58_mp_rank_01_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_58_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3f4e7e35c8365a1013ea356dc68eb4b053805ec7 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_58_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:721131244244d4572abf258ee8860841c5f86c73e572265dc49fdec5bb5df2ea +size 199058914 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dd8b3cd98c924006bd9d9ddc32162890dd3f073d --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:754fc67289bf4c46bfb7cf9dddf821bf30ed49841a8218050091e5d5de4f92e3 +size 199058658 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_59_mp_rank_01_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_59_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6dd8cc0e8ee3d9218c1721d7b23230b7890c785f --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_59_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7d33c5090d1a306182f80d0d7d7a5462242f51b50cb576dcad093ce39804dc91 +size 199058658 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bfd381d2f7aa61ec95018898ad8c984c48115702 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:be2f09c5780f8b06348f09b9505e3aa6b22f23af5e29d657a48b0443e3a4ccdf +size 199058711 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_5_mp_rank_01_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_5_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9bddfbabb78dc614b304e793c99a0e8434752493 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_5_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c5e8a1ab36a9cf3ae0fb2fecb8aca51d0e00843335877acb0f68e29525ea5cb5 +size 199058711 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6dc2bc5abeb578290ac5d6c9139190a557d9dcfe --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:515b0c567cd8256b61dae348923666d9e829923f396f14cbe490aa384ab4b787 +size 199058722 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_60_mp_rank_01_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_60_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6a23e777528b736f28e65a6580a24d53169a2fe5 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_60_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cb885968e6f835f410a085852299cba9dc231487ee45819d08b74c7f6a6b14e9 +size 199058722 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c0acef4af489d95f14a0d3321bd765379044d8fe --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:34218900275f3e6478a889c63896a8334fad5b38081e73d707b7bb7132fb1b8e +size 199058722 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_61_mp_rank_01_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_61_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cf34d1e029aa2e7e0fcba05d8293e2e83bdd31a3 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_61_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:70f79bf35619e94541e45c34cf4d5da7b5afd5151adbdb52b2e82cd42b49bb43 +size 199058722 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dae8d84eec00556bb1b0ee9aa75b612f51cdd669 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0be763d0e611b96b521200893dfe1a830749bcd87032062d6532bc837d0a3372 +size 199058722 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_62_mp_rank_01_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_62_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c6ba29a6949ea6275acf46d28a1eb8ba5f7d9ac3 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_62_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fdbc175500b51eb531d6351d32c33ad691d6b85027052ea0c333dfa76f3db721 +size 199058722 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..effb1dd87716031f221ef084b40d5243853ffd5d --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2230678a3687a1a35a3e5f2f02a19b385e33861c4f8ef5e6b0f8fc91667ab982 +size 199058658 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_63_mp_rank_01_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_63_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bf7b138d4bcedb967569447f87c3717fa5dd7160 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_63_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:617c4fe8fa13d0a8b38081e02881740583caaf5359c59ad6ab0e4bdff4c443ec +size 199058658 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4fa8d2076ae6dcfa35d9a49df1c2733b137b53f0 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a5334cabc0fa05ee2d7cb87cd27dc272455410401985ba57a34e5e8c444e1a7a +size 199058658 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_64_mp_rank_01_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_64_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3bad243bebd9d6a12b6055f951ee559dc48872a9 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_64_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7faa3dcef67a859f12973c3c7200c58205f074bb201eee38a53710798c064721 +size 199058658 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a6b4a93ba67a51fcfa574355fd4726773aff4211 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1086947692ece6e0ba6d0ca193e89534e4c41e54ec7b6cd07b82861c1b9382a2 +size 199058850 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_65_mp_rank_01_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_65_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bcf6b333f193d1dae87de8da6d3a235d3d482b33 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_65_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:764260820370bfc720c2f036fa929cebdd65b1f2384d03844fade6fac94995d6 +size 199058850 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8e41076e4b05106646e954d675e18086979e88b6 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1dbe056a91a953b5ee5981ca1a202ef647b2ae4277e7d3c2d8045609f8add975 +size 199058722 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_66_mp_rank_01_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_66_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..12be99c531b6db833f6d104b8a946bf4224510ab --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_66_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:761933282dc7e4e5ec8f150e1aaf3e6a6690f6f89ad1abe2ae9d17cbd4f71f99 +size 199058722 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..62170830fca026cd0bb31e64a723a3500b6c58f8 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a71edba2c8a73fe00da188a704feb04bb14e9d9c72f5298a76c76ba1659fd437 +size 199058786 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_67_mp_rank_01_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_67_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ad1cc40e62a16d45c59a1c22c9b94081523b653e --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_67_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1354c55428b5ab3092622f2e72c716202e2a84c4d39d368cf8a4d77882a39c29 +size 199058786 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b38a95636fae56b993c0e0edd53b90e36266c68b --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:66d747d9f359a2cf23feba67b6cec325ca107f49cf363a59979b1ae06e9a8dd9 +size 199058658 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_68_mp_rank_01_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_68_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1eb129dbb29439cdb56cf7b0757fc6d20f60d112 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_68_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a280cd22e68944a9b32510a89ebf2e9795c712ad09d028fcf7ff9de6e9c2c677 +size 199058658 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7ef28d449c753e3344703e78958dea40f3ed2ebb --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:24c69c6e4c97739d8bcf419190e6a78897a685ccbdac66e356fc56f9f719a1f8 +size 199058722 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_69_mp_rank_01_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_69_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..add3f554fc67f393b5141facc4fe0e10f1741370 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_69_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b26d6f9020d76ae2c03831507709f8cd9cd4f99cd24035fd62888f1c153d165 +size 199058722 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e780bd3defff08f76803956d01e38eac3c2b4e8c --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5b665f537b2c68ae6de6ac61fbbd283d5aa18c2b2557a93e2ae68596b531bbb7 +size 199058647 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_6_mp_rank_01_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_6_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6408a63df6a3737ccba81e4e8631114f16bf3deb --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_6_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2e36c731cb269574dc862fc4636f65e0748c4adf8f07f616df9a2a59a7d93895 +size 199058647 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fd9af6c80b4b3281efcafed08b907476039530fc --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:629f7ca5ac271f1ddb2941c1ac8336e13b3c70d8152094507691ae9298f2677a +size 199058658 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_70_mp_rank_01_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_70_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..22d196fe96230e19b41d91894427be418bc63f55 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_70_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b96534a5393e9b86aeed3e8b91fdb15c5baab0823621215d0dd41a0934851b74 +size 199058658 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..137e1de5edaab4b9ac77d0d58b7fd4d62a23fb07 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6e0c786908fe84dcca4001b91f94578dd91d80f1d7e1c6de5d27c3fe49cb8dc0 +size 199058722 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_71_mp_rank_01_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_71_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b3126337651058e4b769ec92d0c4ca7d86f5b1ed --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_71_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5cb67bf6e914973c424e6dbd83d95e4a6b3cfb0aa4c7b99e756888f06dabcb9c +size 199058722 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..474c3cb316a51d8fd310bcc0099aa699d0afac03 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2fb57052fe667aa740ffeac29555fac37f574b7c2622db9aa461a967b1222574 +size 199058786 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_72_mp_rank_01_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_72_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7153bb07dac2fd0dc02a40e390f7447ee9b4d9f7 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_72_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bf3b9d64902366093169e8a36d064c645cb38326b00582383db9c8b3adf8ff30 +size 199058786 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a0f6ec748d0983f10330c91af166af5d6ce7b634 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:453dd27d800e6b7d8698e665f3f89e1be269f59af12853ebda7f52aeacd3313f +size 199058722 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_73_mp_rank_01_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_73_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e15f1c950966e2dee710b6eea68f6af2877591c4 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_73_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:de6e63e803a28646c3d7ce03c02f2f5be874c2b4fb3ea914771cf20d848f44fc +size 199058722 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..292a3bcf33f3305746063ed99914118066555da3 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:75b948f02492b4627acc8d6d0243be53d66e898034d459031922ccc608f42832 +size 199058786 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_74_mp_rank_01_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_74_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bdbaf0f473d4622a643607477409b1235e34ebe1 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_74_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8fe354875e733866507e5d6e34137ab57c19778afa83a01facb1fbad6cd21e9f +size 199058786 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..64edac2a4cd633e20310fd1143d8d4e4ad41e485 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2d3e448b1244753e04082d6b0ab8c1d67e15d9a54b73bac8733a9e5368fddf6a +size 199058658 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_75_mp_rank_01_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_75_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..928a71aa8cd58a96fc00bad80a2dbc120e08d909 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_75_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee44c146dc6c5497f4beab8178f7238197725679bf0a54e2b5173b7911dba553 +size 199058658 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6497f158a13e1d8c9fe31ecd49a312d5cea684a9 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e85c5385b74adea30399fa9b4e039a600e9cbc29d237006c3cfd0da63580f23d +size 199058786 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_76_mp_rank_01_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_76_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8fb2330236dab9b42074d25a028dd4bdce7532d8 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_76_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:43b7a99948479a0414e66be377e52e392706f8eec2a9b59e6eb13b9c755f211b +size 199058786 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f8c0353b627c6ebba51e664766cbe548696fc6ab --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:88ddf0b892c30bc687763112d88efd82e420f36339ded75a37b2934557aacd19 +size 199058658 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_77_mp_rank_01_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_77_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0ad2be2d6c0dcf5ce8aa44c20dcf17fd33bfbcfc --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_77_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1586fce68acc444974689d8f90000a095b6f8401103494399c745b6d51839684 +size 199058658 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b6d0333aba6f84293ccdbd62c1abe00754f5abaa --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:19f3853a177696b7b6c9883f7d9d8d2516e5d288998e95d029312d89185fd585 +size 199058786 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_78_mp_rank_01_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_78_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9f2f094fc04582aa30914a1940c44c6576abcc69 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_78_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:978d4f08718b5b9090fa34a5fcc412d505d46deb21dce66ec7b7eba56008d428 +size 199058786 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4ffa8db019ba6e6da07cf6c5c573c47aef142d7d --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:607b7e7c129ca6057426495c6c8a457fb06475d9217281f6d703f1ae34cce528 +size 199058786 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_79_mp_rank_01_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_79_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b61f0df850a1a901e0b13741fcfbbb408a1687f9 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_79_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d6361a24c08940a1d4efd6ea7c4709ff52107241c5cc2582653c995186593dc5 +size 199058786 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..946562e87e0c256baa1d4bcf92b56d7dc221aa2b --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6d861f88e95117b65a45790c2209ad1fcdf192b62e4d8a4bbd144fe21423cf65 +size 199058647 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_7_mp_rank_01_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_7_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2fad48530690f16c44303f798c79900b32aa3eb1 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_7_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:685f5edff24225e2a1bbfdeaa8be88b516a3ae52c930df2c869cb4736ceb9a09 +size 199058647 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..beb84a4771bb891f3e61114efcc2969bc83a46be --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3edbe2eec52436838ab20c79075f7596de39fd87345a35184323c89cc22b98b3 +size 199058722 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_80_mp_rank_01_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_80_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3b9b0a1fb1affbc8ab6796b27d33f3b8247b236b --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_80_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dfbab0c43c2f415a48f3b7e8d6e69d604062ce3d56b97ec9eb3c1bf688b4db49 +size 199058722 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c5551da4a8f18fd45930ed2dfb29e24dd13d191f --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b0bf14f246e1f3364c37d51711a4e61cbbc68e8df9edd269f334ec74ef9b9586 +size 199058722 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_81_mp_rank_01_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_81_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..39e29b336f3220a6242304c2438532060550855f --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_81_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f8247392b946f1647c74a99cf63b7ff9974f00f9eb15adf9dddc1728cd70a8fa +size 199058722 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9021b1b05477f77edc7ab6d7cda82140005cadfe --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9844f2a39506d39e00bca18a0e22bac5445ed77b82bcebd7a11d64b49a08b660 +size 199058658 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_82_mp_rank_01_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_82_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..eeda482ca88736de3e25ed74a2e52c7086dcc680 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_82_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4adc79928bcac95279d606a4853de613acdc2bdb5ebb203fd9246b95a3d77866 +size 199058658 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..36d279f285621de584426f97a25c02652aca42d2 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b204fd9143626510ce18cff55dcc3d1e55a9c9e1f21a20a8ab8baf8265ad7949 +size 199058786 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_83_mp_rank_01_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_83_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0a1635ffec1c1d3ad32c87199536275db9340cfe --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_83_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3ab97cd83081307e17a6bae57a0b3f7ffa024fa09d72597177876fdefb2b12c0 +size 199058786 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..21fbf4f49e73e2810eb6b5053af26cd8fb66977d --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a9ad56711947c730af7f2fd4454f3e68f1b3cfcca9eb52753866b2550abcffcd +size 199058658 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_84_mp_rank_01_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_84_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..26b18f9cac3c720b36be2ac655739361bfd3be0b --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_84_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7780837c341adaf24a1f40837b20200450e5f27b6c9a5069610d4a95ab41bf2b +size 199058658 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3dc6e929c57d1db253bbef3798fd1f1a16edfe62 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:349b92dde0c5d1f097d689b3963448771e53d4536ed29a2a877d1467d50340d6 +size 199058786 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_85_mp_rank_01_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_85_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2683419d1d57f3bdbc131e54051044072be65d62 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_85_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b709d9f17b1187b5af17a7ed2b4500088c64d600d94d51e4b67b294ae31d9696 +size 199058786 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b9962e1a24060cc2550ea8e09933050c3abe8e9f --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd3fdb9cbcbfbcc882c887d56227ab5c5f63bf066f926e27b05787ad2fc8b425 +size 199058786 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_86_mp_rank_01_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_86_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..42c1cdd1a9d2dcfd42dcddc4fe3808af73ee04f3 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_86_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0eef66123b64358567892e8eff6d99dfb81c5e7006a6d173210ef2a2a190df0f +size 199058786 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..85d189c2ab1b9f3a2196d005db3e4c856f826ff2 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a3b5ca8ab1658a89e4996199e2012f4d41e36b248feb4028b2c414b105b013e1 +size 199058722 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_87_mp_rank_01_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_87_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5f8afa49a3f4e29db41ea552c3474023d8deacdc --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_87_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4c08bfcf59a33454235406544b99a24c57dd6bdb4ebab51075dd281ece53906f +size 199058722 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b0ded0a0d9c84339d3c7346ccbefe226b5a56177 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6578899a79edae255cd0b6b5349034915fcfb01af13b24bd58b43bc20f2015b0 +size 199058658 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_88_mp_rank_01_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_88_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..053c92750d32fa1e3c0a82b921583ae53a6cb966 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_88_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c870af335ecdeac5f031dad019139501f79d581e41a9ff23ef328cfb24da7634 +size 199058658 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..42c8b2b191d0f3b818c705a1ee16082ee534763c --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0613a095ed7c2d6e0e7b9b5808fc721779c31bfbde0b101d633228f46abd8d8e +size 199058658 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_89_mp_rank_01_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_89_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4f95cec4b48fd1dd042ea0887cbd0099b3e59c2f --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_89_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:701abaced18b9c001b23db1c08ffe9a5bf60eb89cbaf9d525e0f3ac7e3c93bd9 +size 199058658 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ba430122e1fefe76d9a40b987865d362094f7b64 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a4cdbadb92d12628b9c21bc72598aad9c23fd97258d134e08ab79262ec40e54 +size 199058647 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_8_mp_rank_01_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_8_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..68334347fe8285e4da49b5c6e1bcb438ccf953f4 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_8_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cc675f18bfe48bb58748d9b24e3e713402086c03a004ff1ed87510903836e1bd +size 199058647 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..77e85e8764d7c803ed4628f675c51fdabc4304b3 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:130140e1e298ea25bffdd486ef920838c12ad64e119577b6785d2447883af9ef +size 199058850 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_90_mp_rank_01_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_90_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a2fc78d03046bdcef5bfe6321f458acb24449ae9 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_90_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2bc5632568c8dcbfbc3cfb44198ba114cdc14bcbb9a14db4426a2d20d50fb88c +size 199058850 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5008409ca709951b1cc1799b97566982c9af7cdb --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c3dfd963bb36f72cb780bacd3b05423f811f42429cf78d2d02e2cbf330c44f8d +size 199058722 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_91_mp_rank_01_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_91_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d86aaadf2bb1d21cd7aa6da412b20b9ac2d53553 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_91_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6e26af67836815adfa5c27da9e3ce86746ab7136aa3755338b33a78917efb8d7 +size 199058722 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..feb396c6ba9c8bcd0dc6843f531869d549b8a4b7 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:727193f77f607619f0f4f41a74684b6a1cd4420678716b3845d69243da002671 +size 199058658 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_92_mp_rank_01_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_92_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8a8ef65e35dffa46d08011b8e87a035d67d64bfa --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_92_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:deea861a9bb8d2f9c481155fdee480c340a44dd726e8c55f00913b26f45d00cd +size 199058658 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6c50a827912d5842062c25cca807faeab7909a81 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f0861148952d318944dad02dd800c0554c59d569c1d9e807d661dc1541881d1d +size 199058786 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_93_mp_rank_01_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_93_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cd9203476e77876cd30a4b0972a855321319e4a7 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_93_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2cf18a70813cb66d90f72c1f43f5e4121801075f090e236e617166d71f27990d +size 199058786 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e1b21be5936315322b948ade3c0f9eddd40f471e --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f4c3ca67442c1c227cf722292c19d108cec98585293d02115fca2e2760e5bc0 +size 199058722 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_94_mp_rank_01_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_94_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f43493d295508e1c5341166fc3bb3c89333f1fe5 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_94_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:17ce4a97a136b96224a4c479c5a02153ab3f1e23da282227b352ed4bc4bb3cad +size 199058722 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1a50d7862484b00dd953297a2d108c0f309a7043 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ed8ec1015c043e70ef85a7a7cfc27aeaeeb1d3981f60a5cbcefae31fc1f03b74 +size 199058722 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_95_mp_rank_01_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_95_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e3542d550dddd141c7a9b3acfa85b224760f53d3 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_95_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:adc7fbef4fdc130df0ca402cf7af5b19b1fb826cec1fe34c6792e245dfc50618 +size 199058722 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bf75b20bf8e2b2ab52d8696d9bd26b725c8c8cf1 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:84821235fd5a33fff4f81eb0be883bae8203a951950919e110343ae801797b8d +size 199058722 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_96_mp_rank_01_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_96_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..871ea7f98c50c245d0c47913b586805b0e70058d --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_96_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b93b5a00e391e60b8cf4f4cfd8cadf1ff827d0af2e0241c22b0d6906a04c96b +size 199058722 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9b0358209959d3809777c8294575d1d64f555735 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a28c750d4e6f0a3d2f79776c0226f75ba3e1815185b98a135d689c31a523cc4 +size 199058786 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_97_mp_rank_01_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_97_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d40daf09ae209f9951b2f0cc81b1f2b24ee1d203 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_97_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f6a26f51669d4b8ff0509d8202f7aa56c19639c9a03dac250f9819049631dd9 +size 199058786 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d2fab366b35c31f7740a8a5fa301351f3fce28ef --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a622c6c0d087feda10bf2ada55d6691f9dd0a15f3de60bd66946bd140983ece +size 199058658 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_98_mp_rank_01_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_98_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4760d6b93b8c541ca4a861af4641e07742fefa86 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_98_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ce68270f739dfc957e78dbb41bc0fb1d4b655b5ca3d235b2f048e8b834be36fc +size 199058658 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6b80d87515cd2c16d7940fea330843362be25ed0 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4a0e1e1d4ab2bec5985594e7ca80d5ed0350ce5470b40c10ee3b49dc620a9dd4 +size 199058658 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_99_mp_rank_01_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_99_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3813a044479cb3997db7039b531ea9cd0921c9f0 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_99_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1fbc97dc4072c6851e461cc9a952988b7caba74a488dfbd6433fb7e99709e54e +size 199058658 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cbd90c61a7fb987a7d75d9738499a26467741fa6 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:24f6cbd74769bdbd04ae8f4e9d62c7e4bcea06d5d26ed7c40b710303880236bd +size 199058839 diff --git a/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_9_mp_rank_01_optim_states.pt b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_9_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e34dd62ec4250d8f6e2b71c3d9ed43a75984edf6 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/bf16_zero_pp_rank_9_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9efe4fa38d614d3d0f2ffbcf89787a0f322a9a41c27b2b283d9a87619cda659f +size 199058839 diff --git a/4b284b1b9c4seed3/global_step80108/layer_01-model_00-model_states.pt b/4b284b1b9c4seed3/global_step80108/layer_01-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e885dd982255eed5c7c9a64c0ee55506463143d0 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/layer_01-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4de1b43ee059a65f0cb3c07a175d18729acd1dd55c7bf7355949985f3b6fd3ac +size 167511299 diff --git a/4b284b1b9c4seed3/global_step80108/layer_01-model_01-model_states.pt b/4b284b1b9c4seed3/global_step80108/layer_01-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6029ee2b8637ac603ace38d1cf95c00bbec38bf6 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/layer_01-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:42a23f67a11035244f7777d41646050c35377a8eb1f7967215f626ebe3ec8984 +size 167511299 diff --git a/4b284b1b9c4seed3/global_step80108/layer_03-model_00-model_states.pt b/4b284b1b9c4seed3/global_step80108/layer_03-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a85bb35bda22a8789f6c1ad25d2baf5dcb833f5e --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/layer_03-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a30ec9768c974611bacba5acb4091ca769e8c182f42ae7f6472533ca9b6189e0 +size 113308931 diff --git a/4b284b1b9c4seed3/global_step80108/layer_03-model_01-model_states.pt b/4b284b1b9c4seed3/global_step80108/layer_03-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fa284243ec78137916b364655177e75b42470993 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/layer_03-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:20836a2e9cfa43cd07baa61bbfd3f55d930b1ae683b05e4dd018a77de4b82c93 +size 113308931 diff --git a/4b284b1b9c4seed3/global_step80108/layer_04-model_00-model_states.pt b/4b284b1b9c4seed3/global_step80108/layer_04-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5fcf2ff60e8b6e95afae6661bbe62a644819bb5c --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/layer_04-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d9782f7357d6eb4ab2c968597c809426f8b514a30d9e93d0a0516e97a6596fbe +size 113308931 diff --git a/4b284b1b9c4seed3/global_step80108/layer_04-model_01-model_states.pt b/4b284b1b9c4seed3/global_step80108/layer_04-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ab08e969793bf7a0f60551a668a36a2854ab63f9 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/layer_04-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:78db57722d1f1cb59721115bc9bffbb0f29f0873dec4ba8153a25819cf71f662 +size 113308931 diff --git a/4b284b1b9c4seed3/global_step80108/layer_05-model_00-model_states.pt b/4b284b1b9c4seed3/global_step80108/layer_05-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6c2546a37bd1996911eb296d44230ff6b45b2b32 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/layer_05-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b2772d2fab335de08e4d2cee1d61d6c9d44d29608e4f0de671db73977f7e5f3 +size 113308931 diff --git a/4b284b1b9c4seed3/global_step80108/layer_05-model_01-model_states.pt b/4b284b1b9c4seed3/global_step80108/layer_05-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a2d687e0fea0485615d93316c58db46c38b0f04f --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/layer_05-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:51862f8bfb40f0130388338d88d9a3abfb242006304fc68d1a8075b2300154cd +size 113308931 diff --git a/4b284b1b9c4seed3/global_step80108/layer_06-model_00-model_states.pt b/4b284b1b9c4seed3/global_step80108/layer_06-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3666ee868b5d00631fbabc39eb65536d990c5162 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/layer_06-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ecaa8315b96162d406e1572fbb0cd1e6507b642c7f551a0db656292ff7e7666 +size 113308931 diff --git a/4b284b1b9c4seed3/global_step80108/layer_06-model_01-model_states.pt b/4b284b1b9c4seed3/global_step80108/layer_06-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1030b90654bf558ebbdcc00d013940feef17d61f --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/layer_06-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:319449497627cc6bad9c13370c17e87e1a2f3acc96935eb292caff75038f4325 +size 113308931 diff --git a/4b284b1b9c4seed3/global_step80108/layer_07-model_00-model_states.pt b/4b284b1b9c4seed3/global_step80108/layer_07-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4e5341307501eafba35ef9e2d9edc544a7edfe09 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/layer_07-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0ef2f3c655d984c32fbba9d6bbf02cf06d9fc166b86765b8e10facafce4e09de +size 113308931 diff --git a/4b284b1b9c4seed3/global_step80108/layer_07-model_01-model_states.pt b/4b284b1b9c4seed3/global_step80108/layer_07-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bc189d25832fbc0ff6048eca458986281be9c7a3 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/layer_07-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2946e291020cde8dd99ea06fa5068304469ce0cdd7c64956005d975e6850f1d2 +size 113308931 diff --git a/4b284b1b9c4seed3/global_step80108/layer_08-model_00-model_states.pt b/4b284b1b9c4seed3/global_step80108/layer_08-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..357f9371dd81a1ecbc1bf6c0eb9c867f162da074 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/layer_08-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:28d57464d90478158422132f5bf934f36b53effbc8e81432ca9a6c6d3a1dc649 +size 113308931 diff --git a/4b284b1b9c4seed3/global_step80108/layer_08-model_01-model_states.pt b/4b284b1b9c4seed3/global_step80108/layer_08-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b875a7be0971f0787361fecf5196670155082bfb --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/layer_08-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a6138ff44997ef442fe3178698e3257f550e1ee877dbc041768f967bda313925 +size 113308931 diff --git a/4b284b1b9c4seed3/global_step80108/layer_09-model_00-model_states.pt b/4b284b1b9c4seed3/global_step80108/layer_09-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c9321a8699785e3fc324b0d0676af77ed4d6159f --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/layer_09-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5a47dbfc40b07a8fcc43580ce276ca84d53c693365a9afab10be6b0a3620dce9 +size 113308931 diff --git a/4b284b1b9c4seed3/global_step80108/layer_09-model_01-model_states.pt b/4b284b1b9c4seed3/global_step80108/layer_09-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..416b7c29f3e8ba93633a68603076b66d4c360528 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/layer_09-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a1fb3593871a17ca89d500055261327dd4ecea9cf65371f5ee6ce0ee5d97e0b +size 113308931 diff --git a/4b284b1b9c4seed3/global_step80108/layer_10-model_00-model_states.pt b/4b284b1b9c4seed3/global_step80108/layer_10-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2b5d7c7dcd31975af564d9bb70cf4ae73b5af7bb --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/layer_10-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dfa51f9acdc61ccbc9955414cda23215028f54e8027823b66cd76c3068004f28 +size 113308931 diff --git a/4b284b1b9c4seed3/global_step80108/layer_10-model_01-model_states.pt b/4b284b1b9c4seed3/global_step80108/layer_10-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1e668e698b5dda0c4470f3058db7762c2537edbe --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/layer_10-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:be3a9f4613606af8b4bbde19767293564e03c4dde3b5db356e2e05ca044c15ff +size 113308931 diff --git a/4b284b1b9c4seed3/global_step80108/layer_11-model_00-model_states.pt b/4b284b1b9c4seed3/global_step80108/layer_11-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e663aaa4e2c09cff82f03fb879cb7f8dd6bcee8d --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/layer_11-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:caa8dd2fb54b52f97f1a0bb9f79bc4f6f777d7c8219b6404abd733b71b46b7bd +size 113308931 diff --git a/4b284b1b9c4seed3/global_step80108/layer_11-model_01-model_states.pt b/4b284b1b9c4seed3/global_step80108/layer_11-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5d8cc0e760525f7d670023e11b33911f75f8ec54 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/layer_11-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:050d69c989e2e47d793b3f213912252154d54e4a6b1d77193ac43d9a81b3c8ea +size 113308931 diff --git a/4b284b1b9c4seed3/global_step80108/layer_12-model_00-model_states.pt b/4b284b1b9c4seed3/global_step80108/layer_12-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fd2d00d14f04c863e22179281c0bbc8bf8d72024 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/layer_12-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ba812bcffa395ecf990d0f2da9dcda27d69277bb3c29c4950ff1ca466793afd +size 113308931 diff --git a/4b284b1b9c4seed3/global_step80108/layer_12-model_01-model_states.pt b/4b284b1b9c4seed3/global_step80108/layer_12-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1982385c6838700bf98683ce775b1b95930d10ce --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/layer_12-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fc5b2b45b6fef4a901e387c6f184e51b9f44d8612d73c2048e5e9c28c2b22b18 +size 113308931 diff --git a/4b284b1b9c4seed3/global_step80108/layer_13-model_00-model_states.pt b/4b284b1b9c4seed3/global_step80108/layer_13-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a891410ca91a429968a0e031943610cbaf39f069 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/layer_13-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:64a9a62a91ab7d799d7fa6646778ca8fa7728a4e8f5d0c6f08c9d66e0d522890 +size 113308931 diff --git a/4b284b1b9c4seed3/global_step80108/layer_13-model_01-model_states.pt b/4b284b1b9c4seed3/global_step80108/layer_13-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..01eb8abefab299217f7c79c710471f6f53897f2a --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/layer_13-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4a508f92b9f2122bf929c440304df4525b287f38de7f8a620ebf2a316c5ca5c2 +size 113308931 diff --git a/4b284b1b9c4seed3/global_step80108/layer_14-model_00-model_states.pt b/4b284b1b9c4seed3/global_step80108/layer_14-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dea7c8e2ea311228a06995e9d1bd32504e191eaa --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/layer_14-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b0d1c00d1be44006fb26bc20758257f2b7e18d470f011d9732759dcb44292f98 +size 113308931 diff --git a/4b284b1b9c4seed3/global_step80108/layer_14-model_01-model_states.pt b/4b284b1b9c4seed3/global_step80108/layer_14-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..61dc5dbe4bac4cc5e6fda69e6b8639be9938e28e --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/layer_14-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f6ec24a59d5a29262fddcdb02dae109e43c33083f953a2af97280f612544396e +size 113308931 diff --git a/4b284b1b9c4seed3/global_step80108/layer_15-model_00-model_states.pt b/4b284b1b9c4seed3/global_step80108/layer_15-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1339ec7d398f6ed83a61e430d7ec988eb6c4cb82 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/layer_15-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:efa53c0a740bd181c4b752a99af3c3880c1cebad77b803649f177f923c3bc504 +size 113308931 diff --git a/4b284b1b9c4seed3/global_step80108/layer_15-model_01-model_states.pt b/4b284b1b9c4seed3/global_step80108/layer_15-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..768d35946d4353ab87406cbc4bca3a101aa4f93f --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/layer_15-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:550151d8cbadc853f7acdcb5a4f9d2f36ced043b33ace9b44fee83159edec3e7 +size 113308931 diff --git a/4b284b1b9c4seed3/global_step80108/layer_16-model_00-model_states.pt b/4b284b1b9c4seed3/global_step80108/layer_16-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e206186ebddf3c19122782410e067251fd152d46 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/layer_16-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:20b82ac24b8308d080a1fa299a90e8ebd2ca301b05e80454410d661a34a2127b +size 113308931 diff --git a/4b284b1b9c4seed3/global_step80108/layer_16-model_01-model_states.pt b/4b284b1b9c4seed3/global_step80108/layer_16-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3ad8c7986f8bb6ef702c672cc17704a78e51979e --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/layer_16-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d1c1268a9cdb3d39d6881a40928cada1e2a7c76ac8499dc442185b44b655e43c +size 113308931 diff --git a/4b284b1b9c4seed3/global_step80108/layer_17-model_00-model_states.pt b/4b284b1b9c4seed3/global_step80108/layer_17-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f9bed09580bd983a270285b90f3ef6faeb988c23 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/layer_17-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e15dd5d69f2a3dbe91b3c9c5d59d42970cabab6ada22ea0f77501d37fe145ac8 +size 113308931 diff --git a/4b284b1b9c4seed3/global_step80108/layer_17-model_01-model_states.pt b/4b284b1b9c4seed3/global_step80108/layer_17-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5d5d862d85b3d9f3cc5f5fa1da3a4ab15122214d --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/layer_17-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:57493c681bb44ca2aa5fb6ddc855282239757c2812bc7e22abc55bd16947212f +size 113308931 diff --git a/4b284b1b9c4seed3/global_step80108/layer_18-model_00-model_states.pt b/4b284b1b9c4seed3/global_step80108/layer_18-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..65e28db774de8868ef3f95e702102e57248541c7 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/layer_18-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7cf0e07f1fc08e126fb198ea4d7d31d8f4f0a65dadc028186cd1fc70e98c2a9e +size 113308931 diff --git a/4b284b1b9c4seed3/global_step80108/layer_18-model_01-model_states.pt b/4b284b1b9c4seed3/global_step80108/layer_18-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cc6aeb6840d0c0932c9001425ec3806f6d69a675 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/layer_18-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fefa0b18cccff5fd0af36013a16bebf07eac2362426a377a4d442cb84b7a07cf +size 113308931 diff --git a/4b284b1b9c4seed3/global_step80108/layer_19-model_00-model_states.pt b/4b284b1b9c4seed3/global_step80108/layer_19-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0913802e4755720135f8ee794a191b86d71e50cc --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/layer_19-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:90336b283f84726e8a9ef70c319c03f13ed4b88a898c0c6874c53b52ee9bdacc +size 113308931 diff --git a/4b284b1b9c4seed3/global_step80108/layer_19-model_01-model_states.pt b/4b284b1b9c4seed3/global_step80108/layer_19-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..065c4add26c4c65b74c28769983df5d76527b290 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/layer_19-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:96494ca64ba11360821949963a84e57ce393dec6ffbb05feb3a50f41e091de73 +size 113308931 diff --git a/4b284b1b9c4seed3/global_step80108/layer_20-model_00-model_states.pt b/4b284b1b9c4seed3/global_step80108/layer_20-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a71a1fcd50b682e5b0f2637c4580b7b2bc9ac3d5 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/layer_20-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f5e7d4e7feaa99f2102d13f6ea49ad7a0f7f275723bd47dae97682078643207d +size 113308931 diff --git a/4b284b1b9c4seed3/global_step80108/layer_20-model_01-model_states.pt b/4b284b1b9c4seed3/global_step80108/layer_20-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6cd13dec71da048fafa7df4558568d72d7519d75 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/layer_20-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aab44c5e2ed325f7b00953318ceaa34e0bef8c69bff46530e24e1441e38eab42 +size 113308931 diff --git a/4b284b1b9c4seed3/global_step80108/layer_21-model_00-model_states.pt b/4b284b1b9c4seed3/global_step80108/layer_21-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8489fb7514eedec71d9304f2a7b789a874f90d9a --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/layer_21-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f1687eb69ccdc1e32c5a010422a5bb996c8c4254625a150077692eba472640ae +size 113308931 diff --git a/4b284b1b9c4seed3/global_step80108/layer_21-model_01-model_states.pt b/4b284b1b9c4seed3/global_step80108/layer_21-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6a41628120e88fd5a7ad93d3d14a1f2dac5cb0bb --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/layer_21-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a83a0644fa5186f9b8d16063111841e219bf4e66c5f2927e197c99f99760463 +size 113308931 diff --git a/4b284b1b9c4seed3/global_step80108/layer_22-model_00-model_states.pt b/4b284b1b9c4seed3/global_step80108/layer_22-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..768b6c06c188278c0cb2e4e2b0ed16a6fa79058e --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/layer_22-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0f982e36b5c167d1dec0a051f4291bb8ea61d218a7966afa9d2991b6c4c20045 +size 113308931 diff --git a/4b284b1b9c4seed3/global_step80108/layer_22-model_01-model_states.pt b/4b284b1b9c4seed3/global_step80108/layer_22-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0385e679fef1254609f4d5556d1bc712fb260145 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/layer_22-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:19377d7e5ba0fc7282e96c055f7a262d5e9accccfdfc76b1d6e57be78fb0c3be +size 113308931 diff --git a/4b284b1b9c4seed3/global_step80108/layer_23-model_00-model_states.pt b/4b284b1b9c4seed3/global_step80108/layer_23-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c7f2747f30598c23780cffdc1fd2f34848bfc80a --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/layer_23-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3845cd7afe4ec513b29870eeb8b406a6d6c9143684a7c433b9dce2bd1ecf5418 +size 113308931 diff --git a/4b284b1b9c4seed3/global_step80108/layer_23-model_01-model_states.pt b/4b284b1b9c4seed3/global_step80108/layer_23-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5fef7c90b8a09f962772a4e447b4b2ff097e336f --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/layer_23-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f635e53764bdbea32f245b51a96f3a3aa949695bc5bf5cb886ce0321fc7a90d7 +size 113308931 diff --git a/4b284b1b9c4seed3/global_step80108/layer_24-model_00-model_states.pt b/4b284b1b9c4seed3/global_step80108/layer_24-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f207741a3b6ba7f74db59fe8c7b0fe5d4f4fe05d --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/layer_24-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0f34017cd265a96a0af9219b4a3ee7c614caaff424ce498b3b0222608384fb19 +size 113308931 diff --git a/4b284b1b9c4seed3/global_step80108/layer_24-model_01-model_states.pt b/4b284b1b9c4seed3/global_step80108/layer_24-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a0952db84d074a0ee2dda074933f5c8273d84a22 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/layer_24-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:054770679f915d1b6e4b77b4abc86eb30c07bb291ac122109acb59ce4ba4722e +size 113308931 diff --git a/4b284b1b9c4seed3/global_step80108/layer_25-model_00-model_states.pt b/4b284b1b9c4seed3/global_step80108/layer_25-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2e30c910d7255a566102a0b2d1b1147b8c3836f4 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/layer_25-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5b739b20fa9b7887fb2ef3634354659d583d03c89bcc61b846d4870294caf76f +size 113308931 diff --git a/4b284b1b9c4seed3/global_step80108/layer_25-model_01-model_states.pt b/4b284b1b9c4seed3/global_step80108/layer_25-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2864dc6d780feff8820f18fd1a83a5f4d4b48c2f --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/layer_25-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:de03208e15474733d8a19e57732aa5e6d70ee3cd02fa10ba7277c7ef341aca36 +size 113308931 diff --git a/4b284b1b9c4seed3/global_step80108/layer_26-model_00-model_states.pt b/4b284b1b9c4seed3/global_step80108/layer_26-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9353866a4ab38ad6928080da9fa5ab38dfb66ac1 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/layer_26-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b3c63570729ff7703e5d7aa36af265b8dafe5fb895e63ac77e056fafb90c155 +size 113308931 diff --git a/4b284b1b9c4seed3/global_step80108/layer_26-model_01-model_states.pt b/4b284b1b9c4seed3/global_step80108/layer_26-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8ff9db42c9c95bb93e85069b34553db29587c68f --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/layer_26-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:35cbddec664a2c52eed0af68914d73e550842f74a403e03b7ab6c4f255161d37 +size 113308931 diff --git a/4b284b1b9c4seed3/global_step80108/layer_27-model_00-model_states.pt b/4b284b1b9c4seed3/global_step80108/layer_27-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..912faca1ff612d52fd4801530d8f9c78f1392a4e --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/layer_27-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fcfa88f51293f0acb541cb5164f7e544c7531b5e4c0ae18b3259a49aee1233e5 +size 113308931 diff --git a/4b284b1b9c4seed3/global_step80108/layer_27-model_01-model_states.pt b/4b284b1b9c4seed3/global_step80108/layer_27-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7bd09a6abf33b6dcb89219eae2d9ea4040815d5a --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/layer_27-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:662cbf9889b157b9d41c31f084f0350e333d6ff480388eeff185624d23f49a03 +size 113308931 diff --git a/4b284b1b9c4seed3/global_step80108/layer_28-model_00-model_states.pt b/4b284b1b9c4seed3/global_step80108/layer_28-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..980a876f85583b92c5cfd09fb117496a05afe516 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/layer_28-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf159fa0e44c892a03d92d25fc940177d9a59251f0cf0aea87202d79b21b34d5 +size 113308931 diff --git a/4b284b1b9c4seed3/global_step80108/layer_28-model_01-model_states.pt b/4b284b1b9c4seed3/global_step80108/layer_28-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..02242521573fb67f11dbc2ae6677a1c25e439789 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/layer_28-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5ac00924122315cf6713255e30a0f789c78bd560ceff0f16020afb203308a569 +size 113308931 diff --git a/4b284b1b9c4seed3/global_step80108/layer_29-model_00-model_states.pt b/4b284b1b9c4seed3/global_step80108/layer_29-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f42440f5326d7d0ac7642d6cbd4701e526abe4e9 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/layer_29-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a0d2c7782c491458f6d4ded553cc623dfa245546e49c4b357075eac36f4b58d +size 113308931 diff --git a/4b284b1b9c4seed3/global_step80108/layer_29-model_01-model_states.pt b/4b284b1b9c4seed3/global_step80108/layer_29-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..176c5144b19f0d3ee586054151b7966dd65f493f --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/layer_29-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:87b9cfe2670bcefcf1a2b10bb049a2b9fc163cde7ed1a51bb9770405984eab95 +size 113308931 diff --git a/4b284b1b9c4seed3/global_step80108/layer_30-model_00-model_states.pt b/4b284b1b9c4seed3/global_step80108/layer_30-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..76662fa60972dda0b8c6f5057dfb8fe622bb84d6 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/layer_30-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:85465d520be8bd558f61fbd85afcce5982e5b7f4cd5df2908b7b195d24c662e3 +size 113308931 diff --git a/4b284b1b9c4seed3/global_step80108/layer_30-model_01-model_states.pt b/4b284b1b9c4seed3/global_step80108/layer_30-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a985bcaf2253c7b7ff94edbc7b008456ccd90cb7 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/layer_30-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c426b2ab183fc5d9f7b24b80d5c9edfa2b76d0ccba24cb2b53141b33d85ba293 +size 113308931 diff --git a/4b284b1b9c4seed3/global_step80108/layer_31-model_00-model_states.pt b/4b284b1b9c4seed3/global_step80108/layer_31-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..638883ade2d90e15c2f4d22d99f2360552c7155e --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/layer_31-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b2bac41ae97afb8f64a5a9ecdddab7d0dd9746a97c8f86b07aa0b254dcd1fae0 +size 113308931 diff --git a/4b284b1b9c4seed3/global_step80108/layer_31-model_01-model_states.pt b/4b284b1b9c4seed3/global_step80108/layer_31-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..521761634475f9efb078a0bbce03a51caf2fe280 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/layer_31-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6de119fd19a49c830769b0303cea98713efbc7f7d06a2c4998a7c37b07f2cb63 +size 113308931 diff --git a/4b284b1b9c4seed3/global_step80108/layer_32-model_00-model_states.pt b/4b284b1b9c4seed3/global_step80108/layer_32-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..62c2744084534d5a98a26710b30566d337c7dfe4 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/layer_32-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6298f378f14d9c6b31a8281a02335aed40e9618d3644885d32278031a92ccbf4 +size 113308931 diff --git a/4b284b1b9c4seed3/global_step80108/layer_32-model_01-model_states.pt b/4b284b1b9c4seed3/global_step80108/layer_32-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7dd536b944fe77ba92f86cc7afe4634de996e7d7 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/layer_32-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad56ebd3db58e68dd3a0749b6ba3c56b2d275d4f4e01a25f4145cbe4a0976d09 +size 113308931 diff --git a/4b284b1b9c4seed3/global_step80108/layer_33-model_00-model_states.pt b/4b284b1b9c4seed3/global_step80108/layer_33-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b0296d0be508479ff5d4110caa5652a56ce5813c --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/layer_33-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b6866fb93257b64cff57c833089a19e8964ac1fab9e6486b1730f8fe1bb8f58 +size 113308931 diff --git a/4b284b1b9c4seed3/global_step80108/layer_33-model_01-model_states.pt b/4b284b1b9c4seed3/global_step80108/layer_33-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fa9c86dfcf63d1131b147e5eec768d8928b5a24f --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/layer_33-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d7393c3873ee7abd30729a5add69e3a28d43d14b746769c68e11055a2924cd4b +size 113308931 diff --git a/4b284b1b9c4seed3/global_step80108/layer_34-model_00-model_states.pt b/4b284b1b9c4seed3/global_step80108/layer_34-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..62b0738730ca19d3ab2dcb6919794cb6641588d7 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/layer_34-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf70a1259f74c5fd46bad60c1545b323b482e76483515ce49dd7172374acd57c +size 113308931 diff --git a/4b284b1b9c4seed3/global_step80108/layer_34-model_01-model_states.pt b/4b284b1b9c4seed3/global_step80108/layer_34-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4a49a2f4d9f2070a3abfc96092f30f5916ff622a --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/layer_34-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a60cb381a0d27fb35e460f316ff14ec3b917c3666cb1f1cba115ce7281a9ddb3 +size 113308931 diff --git a/4b284b1b9c4seed3/global_step80108/layer_35-model_00-model_states.pt b/4b284b1b9c4seed3/global_step80108/layer_35-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..420b2119fc4e3bbdcca6b44d8818e60fd8f67fd6 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/layer_35-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5910218df768e758c5b8b85cc06791037016cd34e29c16feedc72dccf66c6a11 +size 113308931 diff --git a/4b284b1b9c4seed3/global_step80108/layer_35-model_01-model_states.pt b/4b284b1b9c4seed3/global_step80108/layer_35-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7da388861c6de801aa1e9632a88f0e6f9cced7a0 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/layer_35-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:635af35dca42dd813f4bb4cb85bdc541b66142a165af619f5e1448098d43f92e +size 113308931 diff --git a/4b284b1b9c4seed3/global_step80108/layer_36-model_00-model_states.pt b/4b284b1b9c4seed3/global_step80108/layer_36-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7ce3c73ed8220df656f8614cce1a0747c747b8a1 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/layer_36-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b99841e78c118ecdcd41d6996ae4897ce792c63e02cac7c71ab2a3c0842c24c8 +size 113308931 diff --git a/4b284b1b9c4seed3/global_step80108/layer_36-model_01-model_states.pt b/4b284b1b9c4seed3/global_step80108/layer_36-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..363268e360b3dac46237ab447181295ae282355f --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/layer_36-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:986f94a2d1e9a4c6651e015f3ee45e468273c47e4d2753582776a5adff949cc2 +size 113308931 diff --git a/4b284b1b9c4seed3/global_step80108/layer_37-model_00-model_states.pt b/4b284b1b9c4seed3/global_step80108/layer_37-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7607ed7fad561ae76394436fcaa19969cbe49b2f --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/layer_37-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:130b00c8aca492c663f9ba1db74689dc61028dd1e56231dde856afd4768f691f +size 113308931 diff --git a/4b284b1b9c4seed3/global_step80108/layer_37-model_01-model_states.pt b/4b284b1b9c4seed3/global_step80108/layer_37-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..da07de12e804387fd9d340744e92af4921c7c5f2 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/layer_37-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee0e3afadbd971f2e7154ada466bdec800624a8299c199bd0024af8ce21ae406 +size 113308931 diff --git a/4b284b1b9c4seed3/global_step80108/layer_38-model_00-model_states.pt b/4b284b1b9c4seed3/global_step80108/layer_38-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2dec9a38d6b501da52ea151691447538d3433ddd --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/layer_38-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d25b79155085fa68f33059b19ad7bb3ab09d463e6d6021c81cf11ce3aa82a343 +size 113308931 diff --git a/4b284b1b9c4seed3/global_step80108/layer_38-model_01-model_states.pt b/4b284b1b9c4seed3/global_step80108/layer_38-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6c80d378009a843c6813ae70ab6c4ed22742e7c7 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/layer_38-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d87f5f88bf2c334579e718027b48f4a69c5558d03bbbdbb2363471d5f4cdc95f +size 113308931 diff --git a/4b284b1b9c4seed3/global_step80108/layer_40-model_00-model_states.pt b/4b284b1b9c4seed3/global_step80108/layer_40-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d0d2bb758e73e80e187104fb3751ab3c095d8c4b --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/layer_40-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6a65d183cac99800b4a6c9e34789fec628d3434eaeadd3e971404fb663ba03e5 +size 13507 diff --git a/4b284b1b9c4seed3/global_step80108/layer_40-model_01-model_states.pt b/4b284b1b9c4seed3/global_step80108/layer_40-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a21e2c509c2a1f77b72dc33f29d7b11719adffbc --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/layer_40-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:450391fd0fae9e6218b6a316cad0be3216fd3c884f7f87e2fd06c0d4e6ff9150 +size 13507 diff --git a/4b284b1b9c4seed3/global_step80108/mp_rank_00_model_states.pt b/4b284b1b9c4seed3/global_step80108/mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..59ca8263ae824970254218f59917635fc14e260f --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2ed9fcbdbdd370d35d19debea31ad2a0e72059ac70db66f64b540a4d9eb0f995 +size 51507 diff --git a/4b284b1b9c4seed3/global_step80108/mp_rank_01_model_states.pt b/4b284b1b9c4seed3/global_step80108/mp_rank_01_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..248e42787f97ef28694b17a316a15f99253f57b3 --- /dev/null +++ b/4b284b1b9c4seed3/global_step80108/mp_rank_01_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c3a079ff3836ca32c6c17b6d17070985d162d317eacd11d66c74d91250a268c3 +size 51507 diff --git a/4b284b1b9c4seed3/transformers/config.json b/4b284b1b9c4seed3/transformers/config.json new file mode 100644 index 0000000000000000000000000000000000000000..df814c3a71ee49044410636b5eeb4f43611690ba --- /dev/null +++ b/4b284b1b9c4seed3/transformers/config.json @@ -0,0 +1 @@ +{"vocab_size": 50432, "n_positions": 2048, "n_embd": 3072, "n_layer": 36, "n_head": 24, "n_inner": 12288, "activation_function": "gelu", "resid_pdrop": 0.1, "embd_pdrop": 0.1, "attn_pdrop": 0.1, "layer_norm_epsilon": 1e-05, "initializer_range": 0.02, "summary_type": "cls_index", "summary_use_proj": true, "summary_activation": null, "summary_first_dropout": 0.1, "summary_proj_to_labels": true, "scale_attn_weights": true, "use_cache": true, "scale_attn_by_inverse_layer_idx": false, "reorder_and_upcast_attn": false, "bos_token_id": 50256, "eos_token_id": 50256, "return_dict": true, "output_hidden_states": false, "output_attentions": false, "torchscript": false, "torch_dtype": null, "use_bfloat16": false, "tf_legacy_loss": false, "pruned_heads": {}, "tie_word_embeddings": true, "is_encoder_decoder": false, "is_decoder": false, "cross_attention_hidden_size": null, "add_cross_attention": false, "tie_encoder_decoder": false, "max_length": 20, "min_length": 0, "do_sample": false, "early_stopping": false, "num_beams": 1, "num_beam_groups": 1, "diversity_penalty": 0.0, "temperature": 1.0, "top_k": 50, "top_p": 1.0, "typical_p": 1.0, "repetition_penalty": 1.0, "length_penalty": 1.0, "no_repeat_ngram_size": 0, "encoder_no_repeat_ngram_size": 0, "bad_words_ids": null, "num_return_sequences": 1, "chunk_size_feed_forward": 0, "output_scores": false, "return_dict_in_generate": false, "forced_bos_token_id": null, "forced_eos_token_id": null, "remove_invalid_values": false, "exponential_decay_length_penalty": null, "suppress_tokens": null, "begin_suppress_tokens": null, "architectures": ["GPT2LMHeadModel"], "finetuning_task": null, "id2label": {"0": "LABEL_0", "1": "LABEL_1"}, "label2id": {"LABEL_0": 0, "LABEL_1": 1}, "tokenizer_class": null, "prefix": null, "pad_token_id": null, "sep_token_id": null, "decoder_start_token_id": null, "task_specific_params": null, "problem_type": null, "_name_or_path": "", "transformers_version": "4.25.0.dev0", "n_ctx": 1024, "gradient_checkpointing": false, "model_type": "gpt2"} \ No newline at end of file diff --git a/4b284b1b9c4seed3/transformers/pytorch_model.bin b/4b284b1b9c4seed3/transformers/pytorch_model.bin new file mode 100644 index 0000000000000000000000000000000000000000..eda394afafb397e83cdbbb739530f09547fb0ba2 --- /dev/null +++ b/4b284b1b9c4seed3/transformers/pytorch_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:caebeb9572b5bee2c5cc85c4f31fd2f141075c0e3fecf4c8252c9c14e2fb6a4b +size 8781203669 diff --git a/4b284b1b9c4seed4/evaluation/generation/agg.4b284b1b9c4seed4_GEM-web_nlg_en_PALM_prompt_0.json b/4b284b1b9c4seed4/evaluation/generation/agg.4b284b1b9c4seed4_GEM-web_nlg_en_PALM_prompt_0.json new file mode 100644 index 0000000000000000000000000000000000000000..1655ce39c4839a6d99e5f19e8e00d3664de3f6c2 --- /dev/null +++ b/4b284b1b9c4seed4/evaluation/generation/agg.4b284b1b9c4seed4_GEM-web_nlg_en_PALM_prompt_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.26787629279095865, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.02421388470865588}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.053140729220499526, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.001447561888642144}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.2650539620149166, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004611089062355459}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.07916714595011602, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0016165914559961}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.021704917896300822, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0009077529999546599}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.10624239698539174, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0029454877090427634}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.03206245161358705, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0009944025304645106}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.04859565080529351, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0013030805071960487}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.24447365028169235, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0042597620469032324}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.07256452976899888, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0014455163882477753}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.04911887572948648, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0013308973848181627}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.24529807807313986, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004231057274690599}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.07317950398891415, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0014738730467798152}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b1b9c4seed4/evaluation/generation/agg.4b284b1b9c4seed4_GEM-web_nlg_en_PALM_prompt_1.json b/4b284b1b9c4seed4/evaluation/generation/agg.4b284b1b9c4seed4_GEM-web_nlg_en_PALM_prompt_1.json new file mode 100644 index 0000000000000000000000000000000000000000..cc7a4f2bfb6c8f8be585f0e0e2f258e434a7497d --- /dev/null +++ b/4b284b1b9c4seed4/evaluation/generation/agg.4b284b1b9c4seed4_GEM-web_nlg_en_PALM_prompt_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.27346154994880517, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.02188738307683954}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.047626171506349936, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0011352906867889128}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.26035399188160574, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004602505397267029}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.07424112149389747, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0013991731147740165}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.01795733317688481, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0006207760872719163}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.10255465178172037, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0028918136354984434}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.028108438388606747, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0008209525600219419}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.04253166976477524, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0009520378507813956}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.23570739197296856, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004138563159116714}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.06664007036780817, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.001225946991287631}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.044154443741561675, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0010805238879022037}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.24018067638000298, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004203191799368478}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.06858259906736544, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.001295048790148881}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b1b9c4seed4/evaluation/generation/agg.4b284b1b9c4seed4_GEM-web_nlg_en_PALM_prompt_2.json b/4b284b1b9c4seed4/evaluation/generation/agg.4b284b1b9c4seed4_GEM-web_nlg_en_PALM_prompt_2.json new file mode 100644 index 0000000000000000000000000000000000000000..5da6e042f543f2046026688330efe106dc9c175d --- /dev/null +++ b/4b284b1b9c4seed4/evaluation/generation/agg.4b284b1b9c4seed4_GEM-web_nlg_en_PALM_prompt_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.28354223508209625, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.02196438336730763}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.04907071394368477, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0011814228439300668}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.2717922146470884, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004679127784588707}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.077057196050893, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.001405552196581262}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.01847026867964925, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0006271549211076853}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.10837787945721133, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.00292786577048572}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.029195418367829688, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0008404145834110129}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.043547243362200026, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0010632111900203151}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.24217304687370458, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0041386950242398935}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.0683478121462329, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.001219408641805486}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.04538438937137174, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0010999742522302452}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.2509319606971942, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004265166783401968}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.07117154749767428, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.001278540354605195}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b1b9c4seed4/evaluation/generation/agg.4b284b1b9c4seed4_GEM-web_nlg_en_PALM_prompt_3.json b/4b284b1b9c4seed4/evaluation/generation/agg.4b284b1b9c4seed4_GEM-web_nlg_en_PALM_prompt_3.json new file mode 100644 index 0000000000000000000000000000000000000000..3edb3fe581958814fc57d2707f3123366f3aac04 --- /dev/null +++ b/4b284b1b9c4seed4/evaluation/generation/agg.4b284b1b9c4seed4_GEM-web_nlg_en_PALM_prompt_3.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.26231700778830913, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.01677381795342571}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.048773010954172226, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0010801404950998403}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.2723524322573744, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004614644088480283}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.07701202526647727, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0013264916492560968}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.01830389408829641, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.000765761231033471}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.10724024189536346, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0029417688916459905}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.028476680174906326, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0007831062590315599}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.04285349136828219, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0009848666531091866}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.23931793383909106, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0039933449779696656}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.06751038060872314, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0011522535843318086}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.045262801919532414, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.001021866086917732}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.25210574997713586, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004210876653447827}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.0713319417621141, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0012205962369251139}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 3, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b1b9c4seed4/evaluation/generation/agg.4b284b1b9c4seed4_GEM-web_nlg_en_PALM_prompt_4.json b/4b284b1b9c4seed4/evaluation/generation/agg.4b284b1b9c4seed4_GEM-web_nlg_en_PALM_prompt_4.json new file mode 100644 index 0000000000000000000000000000000000000000..6fbbfef1fccbe6b49ea186db7e4f475df8b5954b --- /dev/null +++ b/4b284b1b9c4seed4/evaluation/generation/agg.4b284b1b9c4seed4_GEM-web_nlg_en_PALM_prompt_4.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.2909737297069181, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.016893325417647067}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.05081036279065346, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.001340290442932179}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.27689930067824825, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004592552339097503}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.07880513839875916, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0013577530127801877}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.02000297688991883, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0009665376160012339}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.1098959472411629, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0029265187187869925}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.029911000513183756, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0008104665489277981}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.04469978216410197, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.001228415770141008}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.24325022171643784, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.003959401381097609}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.06910981407367636, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.001165837956941959}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.047479319186822515, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0012835127261851631}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.25785008091098, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004217817751472416}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.07342750134261251, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0012548900975791317}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 4, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b1b9c4seed4/evaluation/generation/agg.4b284b1b9c4seed4_GEM-web_nlg_en_PALM_prompt_5.json b/4b284b1b9c4seed4/evaluation/generation/agg.4b284b1b9c4seed4_GEM-web_nlg_en_PALM_prompt_5.json new file mode 100644 index 0000000000000000000000000000000000000000..18a011b6a2cf4ba97c7e38dadd39762f655feb84 --- /dev/null +++ b/4b284b1b9c4seed4/evaluation/generation/agg.4b284b1b9c4seed4_GEM-web_nlg_en_PALM_prompt_5.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.275592913998383, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.010675634701516879}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.050188036684923054, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0010589097851446405}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.28261873177986385, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004706167216581722}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.07936270839708998, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0013461361721732127}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.018414057787839, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0005667544666951426}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.11149049346375932, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.002957507274568516}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.029335540062254653, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.00077573226541773}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.04348160210158506, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0009025307067376957}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.2468060892224703, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004013696328255729}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.06878175079936166, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0011305052098162837}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.046368846883703685, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0009967098378676012}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.25991163700009623, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0042359736213800495}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.07315850261422062, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0012299656434355821}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 5, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b1b9c4seed4/evaluation/generation/agg.4b284b1b9c4seed4_GEM-wiki_lingua_en_tldr_en_0.json b/4b284b1b9c4seed4/evaluation/generation/agg.4b284b1b9c4seed4_GEM-wiki_lingua_en_tldr_en_0.json new file mode 100644 index 0000000000000000000000000000000000000000..6a7d8fe4e0786e5a514bf20bf35dde9472def9e6 --- /dev/null +++ b/4b284b1b9c4seed4/evaluation/generation/agg.4b284b1b9c4seed4_GEM-wiki_lingua_en_tldr_en_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.1508638357497856, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0019477340479700028}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.24849466528414227, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0025701642988402284}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.17351939045996323, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0018292808999788056}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.028565167813151382, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0007213658899061881}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.04860070927724722, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0012792940293872988}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.033112770233475294, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0007842583345225733}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.11205417400994366, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.001364543594879335}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.19083146969499562, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0020249121235725457}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.1300215852768387, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0012668686976567704}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.14039987541721508, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.001794428495675629}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.23240706811113432, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.002406095416292502}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.16176041579500514, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0016905736140852296}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 1.4498797804800554, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.030033155430787307}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b1b9c4seed4/evaluation/generation/agg.4b284b1b9c4seed4_GEM-wiki_lingua_en_tldr_en_1.json b/4b284b1b9c4seed4/evaluation/generation/agg.4b284b1b9c4seed4_GEM-wiki_lingua_en_tldr_en_1.json new file mode 100644 index 0000000000000000000000000000000000000000..a4ed339da3bef7ebac788dfc2739ce5e8850546d --- /dev/null +++ b/4b284b1b9c4seed4/evaluation/generation/agg.4b284b1b9c4seed4_GEM-wiki_lingua_en_tldr_en_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.1526735082069478, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.001954192368311485}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.2537630901501927, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0025247263534353263}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.17598744290815144, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.001808190292239866}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.02844271878006758, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0007501808391968073}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.048050899811526195, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0013077335984725508}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.032548106421086444, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0007854290741659407}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.11085969871259992, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0013092492625755249}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.1910548183701386, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0019406911815812453}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.1291623611792601, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0012144030507005796}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.14352989085571205, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0018308845070724087}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.23982592472606548, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0024037588777864357}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.1656292822984552, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0016884673231307584}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 1.5523030824089203, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.0404745781112937}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b1b9c4seed4/evaluation/generation/agg.4b284b1b9c4seed4_GEM-wiki_lingua_en_tldr_en_2.json b/4b284b1b9c4seed4/evaluation/generation/agg.4b284b1b9c4seed4_GEM-wiki_lingua_en_tldr_en_2.json new file mode 100644 index 0000000000000000000000000000000000000000..11efe666b36e96fc7b206a9046bf6759d78435f7 --- /dev/null +++ b/4b284b1b9c4seed4/evaluation/generation/agg.4b284b1b9c4seed4_GEM-wiki_lingua_en_tldr_en_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.15614318865894197, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.001953522003890445}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.2564233598947695, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.002443975404517576}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.17851912473986262, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0017588268154772792}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.028786254184172754, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0007381734830468564}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.04721098878117776, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0012484536682449941}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.032531974500306655, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0007707378614567543}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.11436547586059817, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0013634627836511027}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.19403348190827804, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.001915506475404068}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.13175959208331914, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.00119267469976916}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.14706172179649213, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0018475712783318878}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.24190155350034248, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0023184025713278256}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.16809587331436024, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.001653116049291498}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 1.5504469719150438, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.046981957687555205}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b1b9c4seed4/evaluation/generation/agg.4b284b1b9c4seed4_GEM-wiki_lingua_en_tldr_en_3.json b/4b284b1b9c4seed4/evaluation/generation/agg.4b284b1b9c4seed4_GEM-wiki_lingua_en_tldr_en_3.json new file mode 100644 index 0000000000000000000000000000000000000000..21da82ee2c89afc756fde3d9325fea63d179c864 --- /dev/null +++ b/4b284b1b9c4seed4/evaluation/generation/agg.4b284b1b9c4seed4_GEM-wiki_lingua_en_tldr_en_3.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.13699405852667912, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0022271962965683227}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.21313164031151458, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0028175993079765913}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.14977645750144936, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.00199726722683507}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.025286085868956577, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0007388515719204758}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.04046828319806029, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.001196737089891652}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.027873427098971903, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0007427085100927844}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.10087113357194523, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0016060316815470442}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.1621097484851492, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0021946464603937125}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.11096435645199118, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0014009503741229052}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.1288247035213342, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0020910254870389346}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.2007771126062864, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0026617775847568633}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.1408419182005074, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0018690086358082113}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 1.6506772563162972, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.07202666343435976}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 3, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b1b9c4seed4/evaluation/generation/agg.4b284b1b9c4seed4_GEM-wiki_lingua_en_tldr_en_4.json b/4b284b1b9c4seed4/evaluation/generation/agg.4b284b1b9c4seed4_GEM-wiki_lingua_en_tldr_en_4.json new file mode 100644 index 0000000000000000000000000000000000000000..e87fef1702c1e24a4fe5ce7a7b5c864f99ea91b4 --- /dev/null +++ b/4b284b1b9c4seed4/evaluation/generation/agg.4b284b1b9c4seed4_GEM-wiki_lingua_en_tldr_en_4.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.04727049455418174, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0018100262381206956}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.07308789496556233, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.002548253609808092}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.04990479829313592, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0017225289026089794}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.009152769715333476, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0005809882470945591}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.014793686682183805, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0008871836496692909}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.009704784607524384, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0005246010118344956}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.03634445955852837, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0014097418513319498}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.05712304517098294, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002020929141181275}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.038102997687537214, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0012904657107170763}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.04450904725651575, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0017072089167818546}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.06907832245228929, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.002416204133617309}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.04692854753900321, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.001615455808763454}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 0.35442363598057186, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.02957890609663373}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 4, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b1b9c4seed4/evaluation/generation/agg.4b284b1b9c4seed4_GEM-wiki_lingua_en_tldr_en_5.json b/4b284b1b9c4seed4/evaluation/generation/agg.4b284b1b9c4seed4_GEM-wiki_lingua_en_tldr_en_5.json new file mode 100644 index 0000000000000000000000000000000000000000..b9101990d813ca7401222f0b60ded80add482567 --- /dev/null +++ b/4b284b1b9c4seed4/evaluation/generation/agg.4b284b1b9c4seed4_GEM-wiki_lingua_en_tldr_en_5.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.007806943563100253, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0008029596223294583}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.011916878778381854, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0011710685254217557}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.007934022472178462, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0007646898711388704}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.0015499616053509758, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.00024432717225911417}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.0022995865319653413, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.00033582149369530104}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.0014852201283601309, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.00020361223200698468}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.006059612662075617, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0006187644415825575}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.009361683565350928, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0009310373409583372}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.006092063289579814, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0005734478033484189}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.0073509618326022316, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0007548623257902688}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.011247516251388902, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.001102260125459754}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.007474906777946338, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0007195818405089297}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 2.3773909381181067e-07, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 6.777702484631335e-07}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 5, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b1b9c4seed4/evaluation/generation/agg.4b284b1b9c4seed4_e2e_nlg_cleaned_generate_text_restaurant_0.json b/4b284b1b9c4seed4/evaluation/generation/agg.4b284b1b9c4seed4_e2e_nlg_cleaned_generate_text_restaurant_0.json new file mode 100644 index 0000000000000000000000000000000000000000..a91dcdffe070d765d3177d69e045995df40a6529 --- /dev/null +++ b/4b284b1b9c4seed4/evaluation/generation/agg.4b284b1b9c4seed4_e2e_nlg_cleaned_generate_text_restaurant_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 0.8482338536273092, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.06579534941253831}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.03689992434617125, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.00143080390296388}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.03176166527004807, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0015278801549138494}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.029524410502349083, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0012194408459950685}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.005295864917355121, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.000436477995087522}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.008570227243564495, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0006945659775254231}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.006282252522560226, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0005083233271996686}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.034035125364177875, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0013033143404442467}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.02894660702654024, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0013685312959876327}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.02704266874243934, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.001092799039388727}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.034329573061074765, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0013151068156701008}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.028756511365956524, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0013753740219635173}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.027093010874833397, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0011035568012963972}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b1b9c4seed4/evaluation/generation/agg.4b284b1b9c4seed4_e2e_nlg_cleaned_generate_text_restaurant_1.json b/4b284b1b9c4seed4/evaluation/generation/agg.4b284b1b9c4seed4_e2e_nlg_cleaned_generate_text_restaurant_1.json new file mode 100644 index 0000000000000000000000000000000000000000..ed8a2de8501992f2c5cda271c0bd0b51e1b08b42 --- /dev/null +++ b/4b284b1b9c4seed4/evaluation/generation/agg.4b284b1b9c4seed4_e2e_nlg_cleaned_generate_text_restaurant_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 5.942260098167613, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.09441092756090216}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.3146822903840917, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0026228566349168303}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.4073067647472486, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.002694916559116025}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.3304930105126096, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0020464079472463886}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.11973672411480318, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0017049415225723842}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.15858199335292084, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.001880021556117094}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.12621157789802925, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.00144122341707661}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.23121444753390857, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0019617352937841724}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.30603012289790815, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002249710012043417}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.24390496755077615, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0014758735639314516}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.26253682646143983, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0023660383137224746}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.33971109353202855, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.002493554468070354}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.27519248986257294, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0018786355388105225}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b1b9c4seed4/evaluation/generation/agg.4b284b1b9c4seed4_e2e_nlg_cleaned_generate_text_restaurant_2.json b/4b284b1b9c4seed4/evaluation/generation/agg.4b284b1b9c4seed4_e2e_nlg_cleaned_generate_text_restaurant_2.json new file mode 100644 index 0000000000000000000000000000000000000000..5d6f4b2c8075710e93b228074016aaacb46e2185 --- /dev/null +++ b/4b284b1b9c4seed4/evaluation/generation/agg.4b284b1b9c4seed4_e2e_nlg_cleaned_generate_text_restaurant_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 6.725052864934353, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.14629714654304157}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.3370432420794776, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0029582437787025427}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.41475409018206294, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.002581973755669344}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.3455500221300751, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0020567847742166303}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.13924246863995587, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0018935171496830272}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.17241918013486687, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0019222974911274624}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.14215332459928473, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0015526430769182552}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.25285247263136995, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.002281200773310861}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.31635151085258584, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002181518712740274}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.26044817619281624, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0015920982446906947}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.28533453436961675, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0026174427606121924}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.35223597019269687, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.002458693422243018}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.29316637284801744, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0019474180340165936}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b1b9c4seed4/evaluation/generation/agg.4b284b1b9c4seed4_e2e_nlg_cleaned_generate_text_restaurant_3.json b/4b284b1b9c4seed4/evaluation/generation/agg.4b284b1b9c4seed4_e2e_nlg_cleaned_generate_text_restaurant_3.json new file mode 100644 index 0000000000000000000000000000000000000000..475d1cc8794e60d90e2a97f2a7fbbc2d307d571d --- /dev/null +++ b/4b284b1b9c4seed4/evaluation/generation/agg.4b284b1b9c4seed4_e2e_nlg_cleaned_generate_text_restaurant_3.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 6.973175823947467, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.08432471729881086}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.3372869158678504, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.002968659112264888}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.41917585622339343, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0024657865682947604}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.3491442563303595, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002084406661790611}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.1451623356626606, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.001878882685675287}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.1805945511839357, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.001899662372461791}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.14925241670212142, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0015639781562393712}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.25377095839457386, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0023013165756289485}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.31994498910057845, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0020988836643955253}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.2637903997625913, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0016349236936735077}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.2861590985165946, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0026614220152062383}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.35633299447456107, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.00237175789815616}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.29641103594998963, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0019700089086597617}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 3, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b1b9c4seed4/evaluation/generation/agg.4b284b1b9c4seed4_e2e_nlg_cleaned_generate_text_restaurant_4.json b/4b284b1b9c4seed4/evaluation/generation/agg.4b284b1b9c4seed4_e2e_nlg_cleaned_generate_text_restaurant_4.json new file mode 100644 index 0000000000000000000000000000000000000000..b3748fd9b39e36955f31bd4994d4f85751b63291 --- /dev/null +++ b/4b284b1b9c4seed4/evaluation/generation/agg.4b284b1b9c4seed4_e2e_nlg_cleaned_generate_text_restaurant_4.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 6.781202241557229, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.11394876149110739}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.3287498306441592, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.002864037922185099}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.4242438979853323, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.002418778880597351}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.34660270706267965, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002015167448860447}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.14188074782669924, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0018111547132663394}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.18330145095889133, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.001867227120259638}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.1484646710112249, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0015009486601977229}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.24760447580397063, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.002205771870408524}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.3245629843061881, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002091486936788564}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.2623953647532703, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0015873390211834876}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.2799336817988539, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0025898070057799047}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.36159803652552097, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.002354029382709626}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.2952178835224044, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0019315028392222534}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 4, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b1b9c4seed4/evaluation/generation/agg.4b284b1b9c4seed4_e2e_nlg_cleaned_generate_text_restaurant_5.json b/4b284b1b9c4seed4/evaluation/generation/agg.4b284b1b9c4seed4_e2e_nlg_cleaned_generate_text_restaurant_5.json new file mode 100644 index 0000000000000000000000000000000000000000..bb864417c500068cb578ce88284b00d34e06c283 --- /dev/null +++ b/4b284b1b9c4seed4/evaluation/generation/agg.4b284b1b9c4seed4_e2e_nlg_cleaned_generate_text_restaurant_5.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 6.685901964010736, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.1354495963808724}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.32176357670299083, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0027967903182063224}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.4272486932644093, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0023809505635255927}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.3437737218331649, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0019546229382639466}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.13815978485481578, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0017518294091340995}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.18494316023841778, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0018444532176795417}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.14683833434343727, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0014540710021065215}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.2417191397949724, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.00214960916866614}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.32601659789964693, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0020925727851936926}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.2596864980022702, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0015675414220731314}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.27513062879919625, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0025215646737994962}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.3659104174188377, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0023445078388895997}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.29423382905586287, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0018901601807881775}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 5, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b1b9c4seed4/evaluation/generation/agg.4b284b1b9c4seed4_gem_xsum_article_DOC_summary_0.json b/4b284b1b9c4seed4/evaluation/generation/agg.4b284b1b9c4seed4_gem_xsum_article_DOC_summary_0.json new file mode 100644 index 0000000000000000000000000000000000000000..3efcc549ee02f83cdd0cabf449e66ea4b0025641 --- /dev/null +++ b/4b284b1b9c4seed4/evaluation/generation/agg.4b284b1b9c4seed4_gem_xsum_article_DOC_summary_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.14337493474921045, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0018970632275809294}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.32850970396744716, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0039197450040575135}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.19381060522505453, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0022326458513688033}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.027496214834546444, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.001054159884756719}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.06556453127883762, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0023771544908032247}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.03756311678020454, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.001356763612763011}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.10679400111516424, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0014304369917064012}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.2459644623091805, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002986298895539128}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.14442948981860032, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0016582345165837742}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.11360184621025315, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0015482924171113445}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.26296431121251945, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.003409100925773213}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.15408798170242552, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0018796051363025486}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 1.445573424695658, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.15425934770761948}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b1b9c4seed4/evaluation/generation/agg.4b284b1b9c4seed4_gem_xsum_article_DOC_summary_1.json b/4b284b1b9c4seed4/evaluation/generation/agg.4b284b1b9c4seed4_gem_xsum_article_DOC_summary_1.json new file mode 100644 index 0000000000000000000000000000000000000000..55322e9022631b9dd6be7ca49d89e5e3e8edcf2b --- /dev/null +++ b/4b284b1b9c4seed4/evaluation/generation/agg.4b284b1b9c4seed4_gem_xsum_article_DOC_summary_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.10765659328853563, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0015212603420465503}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.2657263624255442, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0033066001915549596}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.1513724503049335, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0020050978617654432}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.013942450754043968, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0006842372730185846}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.03481401056485645, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0016493879352824244}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.01966067423050901, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0009461105744381743}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.08261246482339596, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0011168888732104218}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.20552675444508914, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0025401789847852084}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.11639992980160706, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0014853662011968952}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.08719479126054427, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0012099004109665159}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.21714465186994203, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0027534050196141966}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.12287565931519653, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0016075317103237032}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 0.6954014401170389, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.0939232317796097}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b1b9c4seed4/evaluation/generation/agg.4b284b1b9c4seed4_gem_xsum_article_DOC_summary_2.json b/4b284b1b9c4seed4/evaluation/generation/agg.4b284b1b9c4seed4_gem_xsum_article_DOC_summary_2.json new file mode 100644 index 0000000000000000000000000000000000000000..db50a1757e5aef2ed869552800b0f07719210991 --- /dev/null +++ b/4b284b1b9c4seed4/evaluation/generation/agg.4b284b1b9c4seed4_gem_xsum_article_DOC_summary_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.10867457736153135, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.001495555344909094}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.27143929169611797, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.003394856674159156}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.15344534516159183, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0020053949533959292}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.01507662196122561, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0006861991351095634}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.03867163671633521, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0017747285897281744}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.02144461765365429, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0009703360723919554}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.08378473061167403, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0011056093599254957}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.21115579128906609, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002637225983534165}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.11854204244373989, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0014924813777114118}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.08877022608536633, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0012265040039533249}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.22324911827513313, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0029138573801630453}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.12557130842107206, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0016648364713290837}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 0.7307303414586408, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.06155547874417727}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b1b9c4seed4/evaluation/generation/agg.4b284b1b9c4seed4_gem_xsum_article_DOC_summary_3.json b/4b284b1b9c4seed4/evaluation/generation/agg.4b284b1b9c4seed4_gem_xsum_article_DOC_summary_3.json new file mode 100644 index 0000000000000000000000000000000000000000..b782a586d1617d6b5d55e7c043b99126e0fd9a94 --- /dev/null +++ b/4b284b1b9c4seed4/evaluation/generation/agg.4b284b1b9c4seed4_gem_xsum_article_DOC_summary_3.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.10592564096937784, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0017525879317443233}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.2539427012445784, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.003731447303357977}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.1459946014022398, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002181990692411414}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.01420534449614851, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0007006470449943444}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.03590630051582267, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0017733541653792099}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.020061440587479485, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0009777698919290968}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.08153731863940099, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0012887659869021155}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.19693769942475764, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002869678698254578}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.11265406503599139, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.001630908636011174}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.08628916736533274, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0013712543798638922}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.2081960052350543, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0030602079181311892}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.11915978365542443, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0017414042260366922}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 0.7723989217062374, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.07506332455732345}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 3, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b1b9c4seed4/evaluation/generation/agg.4b284b1b9c4seed4_gem_xsum_article_DOC_summary_4.json b/4b284b1b9c4seed4/evaluation/generation/agg.4b284b1b9c4seed4_gem_xsum_article_DOC_summary_4.json new file mode 100644 index 0000000000000000000000000000000000000000..aeb6689cb46278abf7a9b2ac9fea5c7cd72e8195 --- /dev/null +++ b/4b284b1b9c4seed4/evaluation/generation/agg.4b284b1b9c4seed4_gem_xsum_article_DOC_summary_4.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.034471583104804415, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.002238315408267895}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.06381728541655798, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0036282870714125083}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.040215681107462056, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002237517556474153}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.003871537312889549, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0005719133532575095}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.008269838331766569, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0009564670794954605}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.004935566104695442, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0005753566907154545}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.026758973645767164, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0018801400712648681}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.04838251241637687, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0027529301388328257}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.030441951036000715, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0016864228566178527}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.028758380610237905, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0019838383896546154}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.052394609604491466, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.00300800960671939}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.03296335745988539, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.001842268360788242}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 0.4202554532269484, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.12262307961277104}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 4, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b1b9c4seed4/evaluation/generation/agg.4b284b1b9c4seed4_gem_xsum_article_DOC_summary_5.json b/4b284b1b9c4seed4/evaluation/generation/agg.4b284b1b9c4seed4_gem_xsum_article_DOC_summary_5.json new file mode 100644 index 0000000000000000000000000000000000000000..d054c009978f3ac33e77819bb8bee0343bdb1754 --- /dev/null +++ b/4b284b1b9c4seed4/evaluation/generation/agg.4b284b1b9c4seed4_gem_xsum_article_DOC_summary_5.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.002427203615941276, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0006831484429133202}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.0019840191933539033, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0005303913662852268}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.002135746093866511, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0005838656686162581}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.0003678072143665929, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.00015846001855024936}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.0002682301974754805, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0001131215031105469}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.00030743447999977873, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.00013023642706646356}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.0019066685986482705, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0005793006239621258}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.001578844696073063, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.00044617009211618964}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.001686259301474979, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0004921843202278661}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.0019704357925048386, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0005792873025022089}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.00161831401010321, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0004437097896608957}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.001735086296720847, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0004903196095708464}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 1.2660127317243813e-38, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 3.8267567150622576e-33}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 5, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b1b9c4seed4/evaluation/generation/examples.4b284b1b9c4seed4_GEM-web_nlg_en_PALM_prompt_0.jsonl b/4b284b1b9c4seed4/evaluation/generation/examples.4b284b1b9c4seed4_GEM-web_nlg_en_PALM_prompt_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..b860e3c7525766dbff440198b2a5712b20d5ca58 --- /dev/null +++ b/4b284b1b9c4seed4/evaluation/generation/examples.4b284b1b9c4seed4_GEM-web_nlg_en_PALM_prompt_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6af9b61c38ace69a921e6e0568b24c9ba8e5d1c4ce3718de510dcd44d0215797 +size 4181352 diff --git a/4b284b1b9c4seed4/evaluation/generation/examples.4b284b1b9c4seed4_GEM-web_nlg_en_PALM_prompt_1.jsonl b/4b284b1b9c4seed4/evaluation/generation/examples.4b284b1b9c4seed4_GEM-web_nlg_en_PALM_prompt_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..e1e4e43b785a46e4fc0a01897465579f50a4325f --- /dev/null +++ b/4b284b1b9c4seed4/evaluation/generation/examples.4b284b1b9c4seed4_GEM-web_nlg_en_PALM_prompt_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:680747c735f9ba030ea9bcf7abe3a3f8b4bfa85f9c2ba63b165c54fc561be1c4 +size 5103587 diff --git a/4b284b1b9c4seed4/evaluation/generation/examples.4b284b1b9c4seed4_GEM-web_nlg_en_PALM_prompt_2.jsonl b/4b284b1b9c4seed4/evaluation/generation/examples.4b284b1b9c4seed4_GEM-web_nlg_en_PALM_prompt_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..401c9089ba502a1384ee0495663becf22d0ed7f0 --- /dev/null +++ b/4b284b1b9c4seed4/evaluation/generation/examples.4b284b1b9c4seed4_GEM-web_nlg_en_PALM_prompt_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eff3e9dab51d3a469d42f027dc251d0e926f6ec1f27bbb6e7e8fdbdd3bec17ac +size 5990289 diff --git a/4b284b1b9c4seed4/evaluation/generation/examples.4b284b1b9c4seed4_GEM-web_nlg_en_PALM_prompt_3.jsonl b/4b284b1b9c4seed4/evaluation/generation/examples.4b284b1b9c4seed4_GEM-web_nlg_en_PALM_prompt_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..dfb4b2d5a06fdffea4e931aa87ab3987574faf89 --- /dev/null +++ b/4b284b1b9c4seed4/evaluation/generation/examples.4b284b1b9c4seed4_GEM-web_nlg_en_PALM_prompt_3.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:69ffaffad3083622f51b749bc16f7ab99da11dc988e9c933d4e84ef6e4904638 +size 6890235 diff --git a/4b284b1b9c4seed4/evaluation/generation/examples.4b284b1b9c4seed4_GEM-web_nlg_en_PALM_prompt_4.jsonl b/4b284b1b9c4seed4/evaluation/generation/examples.4b284b1b9c4seed4_GEM-web_nlg_en_PALM_prompt_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..7d90db3e472fdc30cad737684c325211dd046781 --- /dev/null +++ b/4b284b1b9c4seed4/evaluation/generation/examples.4b284b1b9c4seed4_GEM-web_nlg_en_PALM_prompt_4.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1c78aac03e293c69f4aad44f6aa7a58aa085d309329a83d3d9cce4dec137678e +size 7799337 diff --git a/4b284b1b9c4seed4/evaluation/generation/examples.4b284b1b9c4seed4_GEM-web_nlg_en_PALM_prompt_5.jsonl b/4b284b1b9c4seed4/evaluation/generation/examples.4b284b1b9c4seed4_GEM-web_nlg_en_PALM_prompt_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..2de251db8fb7f4ae117d6d62e623666f5f10df8c --- /dev/null +++ b/4b284b1b9c4seed4/evaluation/generation/examples.4b284b1b9c4seed4_GEM-web_nlg_en_PALM_prompt_5.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df853bd34a571a41475c1fdbaf56ccb3c56d415ad5eeb84fe259e8e16232666c +size 8699057 diff --git a/4b284b1b9c4seed4/evaluation/generation/examples.4b284b1b9c4seed4_GEM-wiki_lingua_en_tldr_en_0.jsonl b/4b284b1b9c4seed4/evaluation/generation/examples.4b284b1b9c4seed4_GEM-wiki_lingua_en_tldr_en_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..06ebe3f13766bdf32b8a58a1c18e23002c937295 --- /dev/null +++ b/4b284b1b9c4seed4/evaluation/generation/examples.4b284b1b9c4seed4_GEM-wiki_lingua_en_tldr_en_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c9594040f14a1d8a4ba0603321512f90bce2304b27e327546b857390f5c9d6d6 +size 7677455 diff --git a/4b284b1b9c4seed4/evaluation/generation/examples.4b284b1b9c4seed4_GEM-wiki_lingua_en_tldr_en_1.jsonl b/4b284b1b9c4seed4/evaluation/generation/examples.4b284b1b9c4seed4_GEM-wiki_lingua_en_tldr_en_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..8cb28e74760d354a3bc165d0fe06874666c28d9f --- /dev/null +++ b/4b284b1b9c4seed4/evaluation/generation/examples.4b284b1b9c4seed4_GEM-wiki_lingua_en_tldr_en_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2f54fb85ebab6f157b77f0dbdcbaaa1aa5084642f34d974519bdcb68ba65b0e7 +size 13311871 diff --git a/4b284b1b9c4seed4/evaluation/generation/examples.4b284b1b9c4seed4_GEM-wiki_lingua_en_tldr_en_2.jsonl b/4b284b1b9c4seed4/evaluation/generation/examples.4b284b1b9c4seed4_GEM-wiki_lingua_en_tldr_en_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..89163f0c411d8d711a24915dca52297664004a73 --- /dev/null +++ b/4b284b1b9c4seed4/evaluation/generation/examples.4b284b1b9c4seed4_GEM-wiki_lingua_en_tldr_en_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f50bb7a3f7264ed83002bb1841be0ed85a6dfa8667cdef111b17b46e41bd42f9 +size 18909252 diff --git a/4b284b1b9c4seed4/evaluation/generation/examples.4b284b1b9c4seed4_GEM-wiki_lingua_en_tldr_en_3.jsonl b/4b284b1b9c4seed4/evaluation/generation/examples.4b284b1b9c4seed4_GEM-wiki_lingua_en_tldr_en_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..dc71573355c53ebc574a9804a24d6c04af21b33f --- /dev/null +++ b/4b284b1b9c4seed4/evaluation/generation/examples.4b284b1b9c4seed4_GEM-wiki_lingua_en_tldr_en_3.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2dcfd98b07b9c4c3bd2faf3320122fb01a87408082cc615277cef1c94722e0f9 +size 24325563 diff --git a/4b284b1b9c4seed4/evaluation/generation/examples.4b284b1b9c4seed4_GEM-wiki_lingua_en_tldr_en_4.jsonl b/4b284b1b9c4seed4/evaluation/generation/examples.4b284b1b9c4seed4_GEM-wiki_lingua_en_tldr_en_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..b7eb865dd45185a3b24ce98f328eb9cfc46f0b8d --- /dev/null +++ b/4b284b1b9c4seed4/evaluation/generation/examples.4b284b1b9c4seed4_GEM-wiki_lingua_en_tldr_en_4.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1229e379339be5e6d76cb7754e220ede91ccf77ab672578ff83efe261ce91ce5 +size 29472112 diff --git a/4b284b1b9c4seed4/evaluation/generation/examples.4b284b1b9c4seed4_GEM-wiki_lingua_en_tldr_en_5.jsonl b/4b284b1b9c4seed4/evaluation/generation/examples.4b284b1b9c4seed4_GEM-wiki_lingua_en_tldr_en_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..c380dac742171aae1bc56b9b8ae1384a96ab8b39 --- /dev/null +++ b/4b284b1b9c4seed4/evaluation/generation/examples.4b284b1b9c4seed4_GEM-wiki_lingua_en_tldr_en_5.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4a38e0b4c2bd7b2a584ca7f128156629c679f1c875fef71957b3bfcde34c6a86 +size 34799051 diff --git a/4b284b1b9c4seed4/evaluation/generation/examples.4b284b1b9c4seed4_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl b/4b284b1b9c4seed4/evaluation/generation/examples.4b284b1b9c4seed4_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..e23f3ba3f61e1e3a58ea22bcaa16e289d6857286 --- /dev/null +++ b/4b284b1b9c4seed4/evaluation/generation/examples.4b284b1b9c4seed4_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:21959962b61f3b7bd56b2881e9dfe633cf039ca8ed4230b662e1f78b3d129b23 +size 3811809 diff --git a/4b284b1b9c4seed4/evaluation/generation/examples.4b284b1b9c4seed4_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl b/4b284b1b9c4seed4/evaluation/generation/examples.4b284b1b9c4seed4_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..06081f684ca064d4cf12ebe2cca664ff2d0045e3 --- /dev/null +++ b/4b284b1b9c4seed4/evaluation/generation/examples.4b284b1b9c4seed4_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:307a4c36a6906a746e67881f204acb1fb1bc44ff7aa9c905acb08a191f9e6838 +size 5296072 diff --git a/4b284b1b9c4seed4/evaluation/generation/examples.4b284b1b9c4seed4_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl b/4b284b1b9c4seed4/evaluation/generation/examples.4b284b1b9c4seed4_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..b45149cfa5b6891d9b852b66097b086e5d0737c3 --- /dev/null +++ b/4b284b1b9c4seed4/evaluation/generation/examples.4b284b1b9c4seed4_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2735a119490cd12c8a6aaff45e53bf8678072f04d8306b4ea41111f7a01f3992 +size 6362366 diff --git a/4b284b1b9c4seed4/evaluation/generation/examples.4b284b1b9c4seed4_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl b/4b284b1b9c4seed4/evaluation/generation/examples.4b284b1b9c4seed4_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..4e543694950b074c4528d16cba9d524bcc35ea1a --- /dev/null +++ b/4b284b1b9c4seed4/evaluation/generation/examples.4b284b1b9c4seed4_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c1db8fa7b48b2f78786f484e088d11725fea55c0fda5b0c38d22ab29d5c0ddea +size 7449326 diff --git a/4b284b1b9c4seed4/evaluation/generation/examples.4b284b1b9c4seed4_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl b/4b284b1b9c4seed4/evaluation/generation/examples.4b284b1b9c4seed4_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..b41c453fd5eedd45ff43bc4621df3c1affe44280 --- /dev/null +++ b/4b284b1b9c4seed4/evaluation/generation/examples.4b284b1b9c4seed4_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b789ce50dbfd3020c317777c3c7f372fe3ca3a9007ba636fcf8208ec04cbc323 +size 8547189 diff --git a/4b284b1b9c4seed4/evaluation/generation/examples.4b284b1b9c4seed4_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl b/4b284b1b9c4seed4/evaluation/generation/examples.4b284b1b9c4seed4_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..fee41870548e38309715525f94733c37b0244af5 --- /dev/null +++ b/4b284b1b9c4seed4/evaluation/generation/examples.4b284b1b9c4seed4_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:49359e3bb8c063beaafaaadac452a93671d2ab8f14975d5a8dd37defbcc93937 +size 9648168 diff --git a/4b284b1b9c4seed4/evaluation/generation/examples.4b284b1b9c4seed4_gem_xsum_article_DOC_summary_0.jsonl b/4b284b1b9c4seed4/evaluation/generation/examples.4b284b1b9c4seed4_gem_xsum_article_DOC_summary_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..0d850d911700a998435e4e424d265e766099eba0 --- /dev/null +++ b/4b284b1b9c4seed4/evaluation/generation/examples.4b284b1b9c4seed4_gem_xsum_article_DOC_summary_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:17ce4c4f5bf770d8fb4d6de46e3f4c403badbf2e4ead457232b106bc398ad882 +size 2823177 diff --git a/4b284b1b9c4seed4/evaluation/generation/examples.4b284b1b9c4seed4_gem_xsum_article_DOC_summary_1.jsonl b/4b284b1b9c4seed4/evaluation/generation/examples.4b284b1b9c4seed4_gem_xsum_article_DOC_summary_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..4ad721229dfb54906d553fd9a423a919e90cd8cc --- /dev/null +++ b/4b284b1b9c4seed4/evaluation/generation/examples.4b284b1b9c4seed4_gem_xsum_article_DOC_summary_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:15e482846eb5460d86a6bd9b8a41d431c475ad7a8a6f6bc9ef1bf2ca40633265 +size 5104982 diff --git a/4b284b1b9c4seed4/evaluation/generation/examples.4b284b1b9c4seed4_gem_xsum_article_DOC_summary_2.jsonl b/4b284b1b9c4seed4/evaluation/generation/examples.4b284b1b9c4seed4_gem_xsum_article_DOC_summary_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..e1df247cd20c9d88a0ce382167d447a14c87fb7b --- /dev/null +++ b/4b284b1b9c4seed4/evaluation/generation/examples.4b284b1b9c4seed4_gem_xsum_article_DOC_summary_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:069910dabe12ac4c865f70f7ae2841458a93546a2a26247c2b2b3ce285ca06ec +size 7380096 diff --git a/4b284b1b9c4seed4/evaluation/generation/examples.4b284b1b9c4seed4_gem_xsum_article_DOC_summary_3.jsonl b/4b284b1b9c4seed4/evaluation/generation/examples.4b284b1b9c4seed4_gem_xsum_article_DOC_summary_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..a343c93e5d7b46e1efc9622fa40525ece40838bd --- /dev/null +++ b/4b284b1b9c4seed4/evaluation/generation/examples.4b284b1b9c4seed4_gem_xsum_article_DOC_summary_3.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f2aad753c1aea16ddcd264811552585d82c33ddc8b95b979e23e2f46f3cf99c8 +size 9648142 diff --git a/4b284b1b9c4seed4/evaluation/generation/examples.4b284b1b9c4seed4_gem_xsum_article_DOC_summary_4.jsonl b/4b284b1b9c4seed4/evaluation/generation/examples.4b284b1b9c4seed4_gem_xsum_article_DOC_summary_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..fd3923e1a990d6ef1267c63a5224fed439c93349 --- /dev/null +++ b/4b284b1b9c4seed4/evaluation/generation/examples.4b284b1b9c4seed4_gem_xsum_article_DOC_summary_4.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4157e83f0b23de5f710f63c378ef8a4c9f3ca018e489a861af3066e8e92e0123 +size 11672961 diff --git a/4b284b1b9c4seed4/evaluation/generation/examples.4b284b1b9c4seed4_gem_xsum_article_DOC_summary_5.jsonl b/4b284b1b9c4seed4/evaluation/generation/examples.4b284b1b9c4seed4_gem_xsum_article_DOC_summary_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..4c71501b051c613c9f4f6fc0ad6ec8094dcb25c1 --- /dev/null +++ b/4b284b1b9c4seed4/evaluation/generation/examples.4b284b1b9c4seed4_gem_xsum_article_DOC_summary_5.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1402268d0e5b8aa428630b8c54f1bc66aac501448590f8aa77ea112407df65c3 +size 13897495 diff --git a/4b284b1b9c4seed4/evaluation/generation/merged.csv b/4b284b1b9c4seed4/evaluation/generation/merged.csv new file mode 100644 index 0000000000000000000000000000000000000000..0f78743b72b04f5700250834bfff1bffbfbc4abf --- /dev/null +++ b/4b284b1b9c4seed4/evaluation/generation/merged.csv @@ -0,0 +1,53 @@ +dataset,fewshots,prompt,metric,value +e2e_nlg_cleaned,0,generate_text_restaurant,rouge2_fmeasure,0.006282252522560226 +e2e_nlg_cleaned,0,median,rouge2_fmeasure,0.006282252522560226 +e2e_nlg_cleaned,1,generate_text_restaurant,rouge2_fmeasure,0.12621157789802925 +e2e_nlg_cleaned,1,median,rouge2_fmeasure,0.12621157789802925 +e2e_nlg_cleaned,2,generate_text_restaurant,rouge2_fmeasure,0.14215332459928473 +e2e_nlg_cleaned,2,median,rouge2_fmeasure,0.14215332459928473 +e2e_nlg_cleaned,3,generate_text_restaurant,rouge2_fmeasure,0.14925241670212142 +e2e_nlg_cleaned,3,median,rouge2_fmeasure,0.14925241670212142 +e2e_nlg_cleaned,4,generate_text_restaurant,rouge2_fmeasure,0.1484646710112249 +e2e_nlg_cleaned,4,median,rouge2_fmeasure,0.1484646710112249 +e2e_nlg_cleaned,5,generate_text_restaurant,rouge2_fmeasure,0.14683833434343727 +e2e_nlg_cleaned,5,median,rouge2_fmeasure,0.14683833434343727 +e2e_nlg_cleaned,5,average,multiple,0.11986709617944297 +gem_xsum,0,article_DOC_summary,rouge2_fmeasure,0.03756311678020454 +gem_xsum,0,median,rouge2_fmeasure,0.03756311678020454 +gem_xsum,1,article_DOC_summary,rouge2_fmeasure,0.01966067423050901 +gem_xsum,1,median,rouge2_fmeasure,0.01966067423050901 +gem_xsum,2,article_DOC_summary,rouge2_fmeasure,0.02144461765365429 +gem_xsum,2,median,rouge2_fmeasure,0.02144461765365429 +gem_xsum,3,article_DOC_summary,rouge2_fmeasure,0.020061440587479485 +gem_xsum,3,median,rouge2_fmeasure,0.020061440587479485 +gem_xsum,4,article_DOC_summary,rouge2_fmeasure,0.004935566104695442 +gem_xsum,4,median,rouge2_fmeasure,0.004935566104695442 +gem_xsum,5,article_DOC_summary,rouge2_fmeasure,0.00030743447999977873 +gem_xsum,5,median,rouge2_fmeasure,0.00030743447999977873 +gem_xsum,5,average,multiple,0.017328808306090425 +web_nlg_en,0,PALM_prompt,rouge2_fmeasure,0.03206245161358705 +web_nlg_en,0,median,rouge2_fmeasure,0.03206245161358705 +web_nlg_en,1,PALM_prompt,rouge2_fmeasure,0.028108438388606747 +web_nlg_en,1,median,rouge2_fmeasure,0.028108438388606747 +web_nlg_en,2,PALM_prompt,rouge2_fmeasure,0.029195418367829688 +web_nlg_en,2,median,rouge2_fmeasure,0.029195418367829688 +web_nlg_en,3,PALM_prompt,rouge2_fmeasure,0.028476680174906326 +web_nlg_en,3,median,rouge2_fmeasure,0.028476680174906326 +web_nlg_en,4,PALM_prompt,rouge2_fmeasure,0.029911000513183756 +web_nlg_en,4,median,rouge2_fmeasure,0.029911000513183756 +web_nlg_en,5,PALM_prompt,rouge2_fmeasure,0.029335540062254653 +web_nlg_en,5,median,rouge2_fmeasure,0.029335540062254653 +web_nlg_en,5,average,multiple,0.02951492152006137 +wiki_lingua_en,0,tldr_en,rouge2_fmeasure,0.033112770233475294 +wiki_lingua_en,0,median,rouge2_fmeasure,0.033112770233475294 +wiki_lingua_en,1,tldr_en,rouge2_fmeasure,0.032548106421086444 +wiki_lingua_en,1,median,rouge2_fmeasure,0.032548106421086444 +wiki_lingua_en,2,tldr_en,rouge2_fmeasure,0.032531974500306655 +wiki_lingua_en,2,median,rouge2_fmeasure,0.032531974500306655 +wiki_lingua_en,3,tldr_en,rouge2_fmeasure,0.027873427098971903 +wiki_lingua_en,3,median,rouge2_fmeasure,0.027873427098971903 +wiki_lingua_en,4,tldr_en,rouge2_fmeasure,0.009704784607524384 +wiki_lingua_en,4,median,rouge2_fmeasure,0.009704784607524384 +wiki_lingua_en,5,tldr_en,rouge2_fmeasure,0.0014852201283601309 +wiki_lingua_en,5,median,rouge2_fmeasure,0.0014852201283601309 +wiki_lingua_en,5,average,multiple,0.022876047164954134 diff --git a/4b284b1b9c4seed4/evaluation/generation/merged.json b/4b284b1b9c4seed4/evaluation/generation/merged.json new file mode 100644 index 0000000000000000000000000000000000000000..a68448d8e94c819094a60b5fc1888a9874709d3d --- /dev/null +++ b/4b284b1b9c4seed4/evaluation/generation/merged.json @@ -0,0 +1 @@ +{"GEM/web_nlg_en": {"0": {"PALM_prompt": {"bleu": 0.26787629279095865, "bleu_stderr": 0.02421388470865588, "rouge1_fmeasure": 0.07916714595011602, "rouge1_fmeasure_stderr": 0.0016165914559961, "rouge1_precision": 0.053140729220499526, "rouge1_precision_stderr": 0.001447561888642144, "rouge1_recall": 0.2650539620149166, "rouge1_recall_stderr": 0.004611089062355459, "rouge2_fmeasure": 0.03206245161358705, "rouge2_fmeasure_stderr": 0.0009944025304645106, "rouge2_precision": 0.021704917896300822, "rouge2_precision_stderr": 0.0009077529999546599, "rouge2_recall": 0.10624239698539174, "rouge2_recall_stderr": 0.0029454877090427634, "rougeL_fmeasure": 0.07256452976899888, "rougeL_fmeasure_stderr": 0.0014455163882477753, "rougeL_precision": 0.04859565080529351, "rougeL_precision_stderr": 0.0013030805071960487, "rougeL_recall": 0.24447365028169235, "rougeL_recall_stderr": 0.0042597620469032324, "rougeLsum_fmeasure": 0.07317950398891415, "rougeLsum_fmeasure_stderr": 0.0014738730467798152, "rougeLsum_precision": 0.04911887572948648, "rougeLsum_precision_stderr": 0.0013308973848181627, "rougeLsum_recall": 0.24529807807313986, "rougeLsum_recall_stderr": 0.004231057274690599}}, "1": {"PALM_prompt": {"bleu": 0.27346154994880517, "bleu_stderr": 0.02188738307683954, "rouge1_fmeasure": 0.07424112149389747, "rouge1_fmeasure_stderr": 0.0013991731147740165, "rouge1_precision": 0.047626171506349936, "rouge1_precision_stderr": 0.0011352906867889128, "rouge1_recall": 0.26035399188160574, "rouge1_recall_stderr": 0.004602505397267029, "rouge2_fmeasure": 0.028108438388606747, "rouge2_fmeasure_stderr": 0.0008209525600219419, "rouge2_precision": 0.01795733317688481, "rouge2_precision_stderr": 0.0006207760872719163, "rouge2_recall": 0.10255465178172037, "rouge2_recall_stderr": 0.0028918136354984434, "rougeL_fmeasure": 0.06664007036780817, "rougeL_fmeasure_stderr": 0.001225946991287631, "rougeL_precision": 0.04253166976477524, "rougeL_precision_stderr": 0.0009520378507813956, "rougeL_recall": 0.23570739197296856, "rougeL_recall_stderr": 0.004138563159116714, "rougeLsum_fmeasure": 0.06858259906736544, "rougeLsum_fmeasure_stderr": 0.001295048790148881, "rougeLsum_precision": 0.044154443741561675, "rougeLsum_precision_stderr": 0.0010805238879022037, "rougeLsum_recall": 0.24018067638000298, "rougeLsum_recall_stderr": 0.004203191799368478}}, "2": {"PALM_prompt": {"bleu": 0.28354223508209625, "bleu_stderr": 0.02196438336730763, "rouge1_fmeasure": 0.077057196050893, "rouge1_fmeasure_stderr": 0.001405552196581262, "rouge1_precision": 0.04907071394368477, "rouge1_precision_stderr": 0.0011814228439300668, "rouge1_recall": 0.2717922146470884, "rouge1_recall_stderr": 0.004679127784588707, "rouge2_fmeasure": 0.029195418367829688, "rouge2_fmeasure_stderr": 0.0008404145834110129, "rouge2_precision": 0.01847026867964925, "rouge2_precision_stderr": 0.0006271549211076853, "rouge2_recall": 0.10837787945721133, "rouge2_recall_stderr": 0.00292786577048572, "rougeL_fmeasure": 0.0683478121462329, "rougeL_fmeasure_stderr": 0.001219408641805486, "rougeL_precision": 0.043547243362200026, "rougeL_precision_stderr": 0.0010632111900203151, "rougeL_recall": 0.24217304687370458, "rougeL_recall_stderr": 0.0041386950242398935, "rougeLsum_fmeasure": 0.07117154749767428, "rougeLsum_fmeasure_stderr": 0.001278540354605195, "rougeLsum_precision": 0.04538438937137174, "rougeLsum_precision_stderr": 0.0010999742522302452, "rougeLsum_recall": 0.2509319606971942, "rougeLsum_recall_stderr": 0.004265166783401968}}, "3": {"PALM_prompt": {"bleu": 0.26231700778830913, "bleu_stderr": 0.01677381795342571, "rouge1_fmeasure": 0.07701202526647727, "rouge1_fmeasure_stderr": 0.0013264916492560968, "rouge1_precision": 0.048773010954172226, "rouge1_precision_stderr": 0.0010801404950998403, "rouge1_recall": 0.2723524322573744, "rouge1_recall_stderr": 0.004614644088480283, "rouge2_fmeasure": 0.028476680174906326, "rouge2_fmeasure_stderr": 0.0007831062590315599, "rouge2_precision": 0.01830389408829641, "rouge2_precision_stderr": 0.000765761231033471, "rouge2_recall": 0.10724024189536346, "rouge2_recall_stderr": 0.0029417688916459905, "rougeL_fmeasure": 0.06751038060872314, "rougeL_fmeasure_stderr": 0.0011522535843318086, "rougeL_precision": 0.04285349136828219, "rougeL_precision_stderr": 0.0009848666531091866, "rougeL_recall": 0.23931793383909106, "rougeL_recall_stderr": 0.0039933449779696656, "rougeLsum_fmeasure": 0.0713319417621141, "rougeLsum_fmeasure_stderr": 0.0012205962369251139, "rougeLsum_precision": 0.045262801919532414, "rougeLsum_precision_stderr": 0.001021866086917732, "rougeLsum_recall": 0.25210574997713586, "rougeLsum_recall_stderr": 0.004210876653447827}}, "4": {"PALM_prompt": {"bleu": 0.2909737297069181, "bleu_stderr": 0.016893325417647067, "rouge1_fmeasure": 0.07880513839875916, "rouge1_fmeasure_stderr": 0.0013577530127801877, "rouge1_precision": 0.05081036279065346, "rouge1_precision_stderr": 0.001340290442932179, "rouge1_recall": 0.27689930067824825, "rouge1_recall_stderr": 0.004592552339097503, "rouge2_fmeasure": 0.029911000513183756, "rouge2_fmeasure_stderr": 0.0008104665489277981, "rouge2_precision": 0.02000297688991883, "rouge2_precision_stderr": 0.0009665376160012339, "rouge2_recall": 0.1098959472411629, "rouge2_recall_stderr": 0.0029265187187869925, "rougeL_fmeasure": 0.06910981407367636, "rougeL_fmeasure_stderr": 0.001165837956941959, "rougeL_precision": 0.04469978216410197, "rougeL_precision_stderr": 0.001228415770141008, "rougeL_recall": 0.24325022171643784, "rougeL_recall_stderr": 0.003959401381097609, "rougeLsum_fmeasure": 0.07342750134261251, "rougeLsum_fmeasure_stderr": 0.0012548900975791317, "rougeLsum_precision": 0.047479319186822515, "rougeLsum_precision_stderr": 0.0012835127261851631, "rougeLsum_recall": 0.25785008091098, "rougeLsum_recall_stderr": 0.004217817751472416}}, "5": {"PALM_prompt": {"bleu": 0.275592913998383, "bleu_stderr": 0.010675634701516879, "rouge1_fmeasure": 0.07936270839708998, "rouge1_fmeasure_stderr": 0.0013461361721732127, "rouge1_precision": 0.050188036684923054, "rouge1_precision_stderr": 0.0010589097851446405, "rouge1_recall": 0.28261873177986385, "rouge1_recall_stderr": 0.004706167216581722, "rouge2_fmeasure": 0.029335540062254653, "rouge2_fmeasure_stderr": 0.00077573226541773, "rouge2_precision": 0.018414057787839, "rouge2_precision_stderr": 0.0005667544666951426, "rouge2_recall": 0.11149049346375932, "rouge2_recall_stderr": 0.002957507274568516, "rougeL_fmeasure": 0.06878175079936166, "rougeL_fmeasure_stderr": 0.0011305052098162837, "rougeL_precision": 0.04348160210158506, "rougeL_precision_stderr": 0.0009025307067376957, "rougeL_recall": 0.2468060892224703, "rougeL_recall_stderr": 0.004013696328255729, "rougeLsum_fmeasure": 0.07315850261422062, "rougeLsum_fmeasure_stderr": 0.0012299656434355821, "rougeLsum_precision": 0.046368846883703685, "rougeLsum_precision_stderr": 0.0009967098378676012, "rougeLsum_recall": 0.25991163700009623, "rougeLsum_recall_stderr": 0.0042359736213800495}}}, "GEM/wiki_lingua_en": {"0": {"tldr_en": {"bleu": 1.4498797804800554, "bleu_stderr": 0.030033155430787307, "rouge1_fmeasure": 0.17351939045996323, "rouge1_fmeasure_stderr": 0.0018292808999788056, "rouge1_precision": 0.1508638357497856, "rouge1_precision_stderr": 0.0019477340479700028, "rouge1_recall": 0.24849466528414227, "rouge1_recall_stderr": 0.0025701642988402284, "rouge2_fmeasure": 0.033112770233475294, "rouge2_fmeasure_stderr": 0.0007842583345225733, "rouge2_precision": 0.028565167813151382, "rouge2_precision_stderr": 0.0007213658899061881, "rouge2_recall": 0.04860070927724722, "rouge2_recall_stderr": 0.0012792940293872988, "rougeL_fmeasure": 0.1300215852768387, "rougeL_fmeasure_stderr": 0.0012668686976567704, "rougeL_precision": 0.11205417400994366, "rougeL_precision_stderr": 0.001364543594879335, "rougeL_recall": 0.19083146969499562, "rougeL_recall_stderr": 0.0020249121235725457, "rougeLsum_fmeasure": 0.16176041579500514, "rougeLsum_fmeasure_stderr": 0.0016905736140852296, "rougeLsum_precision": 0.14039987541721508, "rougeLsum_precision_stderr": 0.001794428495675629, "rougeLsum_recall": 0.23240706811113432, "rougeLsum_recall_stderr": 0.002406095416292502}}, "1": {"tldr_en": {"bleu": 1.5523030824089203, "bleu_stderr": 0.0404745781112937, "rouge1_fmeasure": 0.17598744290815144, "rouge1_fmeasure_stderr": 0.001808190292239866, "rouge1_precision": 0.1526735082069478, "rouge1_precision_stderr": 0.001954192368311485, "rouge1_recall": 0.2537630901501927, "rouge1_recall_stderr": 0.0025247263534353263, "rouge2_fmeasure": 0.032548106421086444, "rouge2_fmeasure_stderr": 0.0007854290741659407, "rouge2_precision": 0.02844271878006758, "rouge2_precision_stderr": 0.0007501808391968073, "rouge2_recall": 0.048050899811526195, "rouge2_recall_stderr": 0.0013077335984725508, "rougeL_fmeasure": 0.1291623611792601, "rougeL_fmeasure_stderr": 0.0012144030507005796, "rougeL_precision": 0.11085969871259992, "rougeL_precision_stderr": 0.0013092492625755249, "rougeL_recall": 0.1910548183701386, "rougeL_recall_stderr": 0.0019406911815812453, "rougeLsum_fmeasure": 0.1656292822984552, "rougeLsum_fmeasure_stderr": 0.0016884673231307584, "rougeLsum_precision": 0.14352989085571205, "rougeLsum_precision_stderr": 0.0018308845070724087, "rougeLsum_recall": 0.23982592472606548, "rougeLsum_recall_stderr": 0.0024037588777864357}}, "2": {"tldr_en": {"bleu": 1.5504469719150438, "bleu_stderr": 0.046981957687555205, "rouge1_fmeasure": 0.17851912473986262, "rouge1_fmeasure_stderr": 0.0017588268154772792, "rouge1_precision": 0.15614318865894197, "rouge1_precision_stderr": 0.001953522003890445, "rouge1_recall": 0.2564233598947695, "rouge1_recall_stderr": 0.002443975404517576, "rouge2_fmeasure": 0.032531974500306655, "rouge2_fmeasure_stderr": 0.0007707378614567543, "rouge2_precision": 0.028786254184172754, "rouge2_precision_stderr": 0.0007381734830468564, "rouge2_recall": 0.04721098878117776, "rouge2_recall_stderr": 0.0012484536682449941, "rougeL_fmeasure": 0.13175959208331914, "rougeL_fmeasure_stderr": 0.00119267469976916, "rougeL_precision": 0.11436547586059817, "rougeL_precision_stderr": 0.0013634627836511027, "rougeL_recall": 0.19403348190827804, "rougeL_recall_stderr": 0.001915506475404068, "rougeLsum_fmeasure": 0.16809587331436024, "rougeLsum_fmeasure_stderr": 0.001653116049291498, "rougeLsum_precision": 0.14706172179649213, "rougeLsum_precision_stderr": 0.0018475712783318878, "rougeLsum_recall": 0.24190155350034248, "rougeLsum_recall_stderr": 0.0023184025713278256}}, "3": {"tldr_en": {"bleu": 1.6506772563162972, "bleu_stderr": 0.07202666343435976, "rouge1_fmeasure": 0.14977645750144936, "rouge1_fmeasure_stderr": 0.00199726722683507, "rouge1_precision": 0.13699405852667912, "rouge1_precision_stderr": 0.0022271962965683227, "rouge1_recall": 0.21313164031151458, "rouge1_recall_stderr": 0.0028175993079765913, "rouge2_fmeasure": 0.027873427098971903, "rouge2_fmeasure_stderr": 0.0007427085100927844, "rouge2_precision": 0.025286085868956577, "rouge2_precision_stderr": 0.0007388515719204758, "rouge2_recall": 0.04046828319806029, "rouge2_recall_stderr": 0.001196737089891652, "rougeL_fmeasure": 0.11096435645199118, "rougeL_fmeasure_stderr": 0.0014009503741229052, "rougeL_precision": 0.10087113357194523, "rougeL_precision_stderr": 0.0016060316815470442, "rougeL_recall": 0.1621097484851492, "rougeL_recall_stderr": 0.0021946464603937125, "rougeLsum_fmeasure": 0.1408419182005074, "rougeLsum_fmeasure_stderr": 0.0018690086358082113, "rougeLsum_precision": 0.1288247035213342, "rougeLsum_precision_stderr": 0.0020910254870389346, "rougeLsum_recall": 0.2007771126062864, "rougeLsum_recall_stderr": 0.0026617775847568633}}, "4": {"tldr_en": {"bleu": 0.35442363598057186, "bleu_stderr": 0.02957890609663373, "rouge1_fmeasure": 0.04990479829313592, "rouge1_fmeasure_stderr": 0.0017225289026089794, "rouge1_precision": 0.04727049455418174, "rouge1_precision_stderr": 0.0018100262381206956, "rouge1_recall": 0.07308789496556233, "rouge1_recall_stderr": 0.002548253609808092, "rouge2_fmeasure": 0.009704784607524384, "rouge2_fmeasure_stderr": 0.0005246010118344956, "rouge2_precision": 0.009152769715333476, "rouge2_precision_stderr": 0.0005809882470945591, "rouge2_recall": 0.014793686682183805, "rouge2_recall_stderr": 0.0008871836496692909, "rougeL_fmeasure": 0.038102997687537214, "rougeL_fmeasure_stderr": 0.0012904657107170763, "rougeL_precision": 0.03634445955852837, "rougeL_precision_stderr": 0.0014097418513319498, "rougeL_recall": 0.05712304517098294, "rougeL_recall_stderr": 0.002020929141181275, "rougeLsum_fmeasure": 0.04692854753900321, "rougeLsum_fmeasure_stderr": 0.001615455808763454, "rougeLsum_precision": 0.04450904725651575, "rougeLsum_precision_stderr": 0.0017072089167818546, "rougeLsum_recall": 0.06907832245228929, "rougeLsum_recall_stderr": 0.002416204133617309}}, "5": {"tldr_en": {"bleu": 2.3773909381181067e-07, "bleu_stderr": 6.777702484631335e-07, "rouge1_fmeasure": 0.007934022472178462, "rouge1_fmeasure_stderr": 0.0007646898711388704, "rouge1_precision": 0.007806943563100253, "rouge1_precision_stderr": 0.0008029596223294583, "rouge1_recall": 0.011916878778381854, "rouge1_recall_stderr": 0.0011710685254217557, "rouge2_fmeasure": 0.0014852201283601309, "rouge2_fmeasure_stderr": 0.00020361223200698468, "rouge2_precision": 0.0015499616053509758, "rouge2_precision_stderr": 0.00024432717225911417, "rouge2_recall": 0.0022995865319653413, "rouge2_recall_stderr": 0.00033582149369530104, "rougeL_fmeasure": 0.006092063289579814, "rougeL_fmeasure_stderr": 0.0005734478033484189, "rougeL_precision": 0.006059612662075617, "rougeL_precision_stderr": 0.0006187644415825575, "rougeL_recall": 0.009361683565350928, "rougeL_recall_stderr": 0.0009310373409583372, "rougeLsum_fmeasure": 0.007474906777946338, "rougeLsum_fmeasure_stderr": 0.0007195818405089297, "rougeLsum_precision": 0.0073509618326022316, "rougeLsum_precision_stderr": 0.0007548623257902688, "rougeLsum_recall": 0.011247516251388902, "rougeLsum_recall_stderr": 0.001102260125459754}}}, "e2e_nlg_cleaned": {"0": {"generate_text_restaurant": {"bleu": 0.8482338536273092, "bleu_stderr": 0.06579534941253831, "rouge1_fmeasure": 0.029524410502349083, "rouge1_fmeasure_stderr": 0.0012194408459950685, "rouge1_precision": 0.03689992434617125, "rouge1_precision_stderr": 0.00143080390296388, "rouge1_recall": 0.03176166527004807, "rouge1_recall_stderr": 0.0015278801549138494, "rouge2_fmeasure": 0.006282252522560226, "rouge2_fmeasure_stderr": 0.0005083233271996686, "rouge2_precision": 0.005295864917355121, "rouge2_precision_stderr": 0.000436477995087522, "rouge2_recall": 0.008570227243564495, "rouge2_recall_stderr": 0.0006945659775254231, "rougeL_fmeasure": 0.02704266874243934, "rougeL_fmeasure_stderr": 0.001092799039388727, "rougeL_precision": 0.034035125364177875, "rougeL_precision_stderr": 0.0013033143404442467, "rougeL_recall": 0.02894660702654024, "rougeL_recall_stderr": 0.0013685312959876327, "rougeLsum_fmeasure": 0.027093010874833397, "rougeLsum_fmeasure_stderr": 0.0011035568012963972, "rougeLsum_precision": 0.034329573061074765, "rougeLsum_precision_stderr": 0.0013151068156701008, "rougeLsum_recall": 0.028756511365956524, "rougeLsum_recall_stderr": 0.0013753740219635173}}, "1": {"generate_text_restaurant": {"bleu": 5.942260098167613, "bleu_stderr": 0.09441092756090216, "rouge1_fmeasure": 0.3304930105126096, "rouge1_fmeasure_stderr": 0.0020464079472463886, "rouge1_precision": 0.3146822903840917, "rouge1_precision_stderr": 0.0026228566349168303, "rouge1_recall": 0.4073067647472486, "rouge1_recall_stderr": 0.002694916559116025, "rouge2_fmeasure": 0.12621157789802925, "rouge2_fmeasure_stderr": 0.00144122341707661, "rouge2_precision": 0.11973672411480318, "rouge2_precision_stderr": 0.0017049415225723842, "rouge2_recall": 0.15858199335292084, "rouge2_recall_stderr": 0.001880021556117094, "rougeL_fmeasure": 0.24390496755077615, "rougeL_fmeasure_stderr": 0.0014758735639314516, "rougeL_precision": 0.23121444753390857, "rougeL_precision_stderr": 0.0019617352937841724, "rougeL_recall": 0.30603012289790815, "rougeL_recall_stderr": 0.002249710012043417, "rougeLsum_fmeasure": 0.27519248986257294, "rougeLsum_fmeasure_stderr": 0.0018786355388105225, "rougeLsum_precision": 0.26253682646143983, "rougeLsum_precision_stderr": 0.0023660383137224746, "rougeLsum_recall": 0.33971109353202855, "rougeLsum_recall_stderr": 0.002493554468070354}}, "2": {"generate_text_restaurant": {"bleu": 6.725052864934353, "bleu_stderr": 0.14629714654304157, "rouge1_fmeasure": 0.3455500221300751, "rouge1_fmeasure_stderr": 0.0020567847742166303, "rouge1_precision": 0.3370432420794776, "rouge1_precision_stderr": 0.0029582437787025427, "rouge1_recall": 0.41475409018206294, "rouge1_recall_stderr": 0.002581973755669344, "rouge2_fmeasure": 0.14215332459928473, "rouge2_fmeasure_stderr": 0.0015526430769182552, "rouge2_precision": 0.13924246863995587, "rouge2_precision_stderr": 0.0018935171496830272, "rouge2_recall": 0.17241918013486687, "rouge2_recall_stderr": 0.0019222974911274624, "rougeL_fmeasure": 0.26044817619281624, "rougeL_fmeasure_stderr": 0.0015920982446906947, "rougeL_precision": 0.25285247263136995, "rougeL_precision_stderr": 0.002281200773310861, "rougeL_recall": 0.31635151085258584, "rougeL_recall_stderr": 0.002181518712740274, "rougeLsum_fmeasure": 0.29316637284801744, "rougeLsum_fmeasure_stderr": 0.0019474180340165936, "rougeLsum_precision": 0.28533453436961675, "rougeLsum_precision_stderr": 0.0026174427606121924, "rougeLsum_recall": 0.35223597019269687, "rougeLsum_recall_stderr": 0.002458693422243018}}, "3": {"generate_text_restaurant": {"bleu": 6.973175823947467, "bleu_stderr": 0.08432471729881086, "rouge1_fmeasure": 0.3491442563303595, "rouge1_fmeasure_stderr": 0.002084406661790611, "rouge1_precision": 0.3372869158678504, "rouge1_precision_stderr": 0.002968659112264888, "rouge1_recall": 0.41917585622339343, "rouge1_recall_stderr": 0.0024657865682947604, "rouge2_fmeasure": 0.14925241670212142, "rouge2_fmeasure_stderr": 0.0015639781562393712, "rouge2_precision": 0.1451623356626606, "rouge2_precision_stderr": 0.001878882685675287, "rouge2_recall": 0.1805945511839357, "rouge2_recall_stderr": 0.001899662372461791, "rougeL_fmeasure": 0.2637903997625913, "rougeL_fmeasure_stderr": 0.0016349236936735077, "rougeL_precision": 0.25377095839457386, "rougeL_precision_stderr": 0.0023013165756289485, "rougeL_recall": 0.31994498910057845, "rougeL_recall_stderr": 0.0020988836643955253, "rougeLsum_fmeasure": 0.29641103594998963, "rougeLsum_fmeasure_stderr": 0.0019700089086597617, "rougeLsum_precision": 0.2861590985165946, "rougeLsum_precision_stderr": 0.0026614220152062383, "rougeLsum_recall": 0.35633299447456107, "rougeLsum_recall_stderr": 0.00237175789815616}}, "4": {"generate_text_restaurant": {"bleu": 6.781202241557229, "bleu_stderr": 0.11394876149110739, "rouge1_fmeasure": 0.34660270706267965, "rouge1_fmeasure_stderr": 0.002015167448860447, "rouge1_precision": 0.3287498306441592, "rouge1_precision_stderr": 0.002864037922185099, "rouge1_recall": 0.4242438979853323, "rouge1_recall_stderr": 0.002418778880597351, "rouge2_fmeasure": 0.1484646710112249, "rouge2_fmeasure_stderr": 0.0015009486601977229, "rouge2_precision": 0.14188074782669924, "rouge2_precision_stderr": 0.0018111547132663394, "rouge2_recall": 0.18330145095889133, "rouge2_recall_stderr": 0.001867227120259638, "rougeL_fmeasure": 0.2623953647532703, "rougeL_fmeasure_stderr": 0.0015873390211834876, "rougeL_precision": 0.24760447580397063, "rougeL_precision_stderr": 0.002205771870408524, "rougeL_recall": 0.3245629843061881, "rougeL_recall_stderr": 0.002091486936788564, "rougeLsum_fmeasure": 0.2952178835224044, "rougeLsum_fmeasure_stderr": 0.0019315028392222534, "rougeLsum_precision": 0.2799336817988539, "rougeLsum_precision_stderr": 0.0025898070057799047, "rougeLsum_recall": 0.36159803652552097, "rougeLsum_recall_stderr": 0.002354029382709626}}, "5": {"generate_text_restaurant": {"bleu": 6.685901964010736, "bleu_stderr": 0.1354495963808724, "rouge1_fmeasure": 0.3437737218331649, "rouge1_fmeasure_stderr": 0.0019546229382639466, "rouge1_precision": 0.32176357670299083, "rouge1_precision_stderr": 0.0027967903182063224, "rouge1_recall": 0.4272486932644093, "rouge1_recall_stderr": 0.0023809505635255927, "rouge2_fmeasure": 0.14683833434343727, "rouge2_fmeasure_stderr": 0.0014540710021065215, "rouge2_precision": 0.13815978485481578, "rouge2_precision_stderr": 0.0017518294091340995, "rouge2_recall": 0.18494316023841778, "rouge2_recall_stderr": 0.0018444532176795417, "rougeL_fmeasure": 0.2596864980022702, "rougeL_fmeasure_stderr": 0.0015675414220731314, "rougeL_precision": 0.2417191397949724, "rougeL_precision_stderr": 0.00214960916866614, "rougeL_recall": 0.32601659789964693, "rougeL_recall_stderr": 0.0020925727851936926, "rougeLsum_fmeasure": 0.29423382905586287, "rougeLsum_fmeasure_stderr": 0.0018901601807881775, "rougeLsum_precision": 0.27513062879919625, "rougeLsum_precision_stderr": 0.0025215646737994962, "rougeLsum_recall": 0.3659104174188377, "rougeLsum_recall_stderr": 0.0023445078388895997}}}, "gem_xsum": {"0": {"article_DOC_summary": {"bleu": 1.445573424695658, "bleu_stderr": 0.15425934770761948, "rouge1_fmeasure": 0.19381060522505453, "rouge1_fmeasure_stderr": 0.0022326458513688033, "rouge1_precision": 0.14337493474921045, "rouge1_precision_stderr": 0.0018970632275809294, "rouge1_recall": 0.32850970396744716, "rouge1_recall_stderr": 0.0039197450040575135, "rouge2_fmeasure": 0.03756311678020454, "rouge2_fmeasure_stderr": 0.001356763612763011, "rouge2_precision": 0.027496214834546444, "rouge2_precision_stderr": 0.001054159884756719, "rouge2_recall": 0.06556453127883762, "rouge2_recall_stderr": 0.0023771544908032247, "rougeL_fmeasure": 0.14442948981860032, "rougeL_fmeasure_stderr": 0.0016582345165837742, "rougeL_precision": 0.10679400111516424, "rougeL_precision_stderr": 0.0014304369917064012, "rougeL_recall": 0.2459644623091805, "rougeL_recall_stderr": 0.002986298895539128, "rougeLsum_fmeasure": 0.15408798170242552, "rougeLsum_fmeasure_stderr": 0.0018796051363025486, "rougeLsum_precision": 0.11360184621025315, "rougeLsum_precision_stderr": 0.0015482924171113445, "rougeLsum_recall": 0.26296431121251945, "rougeLsum_recall_stderr": 0.003409100925773213}}, "1": {"article_DOC_summary": {"bleu": 0.6954014401170389, "bleu_stderr": 0.0939232317796097, "rouge1_fmeasure": 0.1513724503049335, "rouge1_fmeasure_stderr": 0.0020050978617654432, "rouge1_precision": 0.10765659328853563, "rouge1_precision_stderr": 0.0015212603420465503, "rouge1_recall": 0.2657263624255442, "rouge1_recall_stderr": 0.0033066001915549596, "rouge2_fmeasure": 0.01966067423050901, "rouge2_fmeasure_stderr": 0.0009461105744381743, "rouge2_precision": 0.013942450754043968, "rouge2_precision_stderr": 0.0006842372730185846, "rouge2_recall": 0.03481401056485645, "rouge2_recall_stderr": 0.0016493879352824244, "rougeL_fmeasure": 0.11639992980160706, "rougeL_fmeasure_stderr": 0.0014853662011968952, "rougeL_precision": 0.08261246482339596, "rougeL_precision_stderr": 0.0011168888732104218, "rougeL_recall": 0.20552675444508914, "rougeL_recall_stderr": 0.0025401789847852084, "rougeLsum_fmeasure": 0.12287565931519653, "rougeLsum_fmeasure_stderr": 0.0016075317103237032, "rougeLsum_precision": 0.08719479126054427, "rougeLsum_precision_stderr": 0.0012099004109665159, "rougeLsum_recall": 0.21714465186994203, "rougeLsum_recall_stderr": 0.0027534050196141966}}, "2": {"article_DOC_summary": {"bleu": 0.7307303414586408, "bleu_stderr": 0.06155547874417727, "rouge1_fmeasure": 0.15344534516159183, "rouge1_fmeasure_stderr": 0.0020053949533959292, "rouge1_precision": 0.10867457736153135, "rouge1_precision_stderr": 0.001495555344909094, "rouge1_recall": 0.27143929169611797, "rouge1_recall_stderr": 0.003394856674159156, "rouge2_fmeasure": 0.02144461765365429, "rouge2_fmeasure_stderr": 0.0009703360723919554, "rouge2_precision": 0.01507662196122561, "rouge2_precision_stderr": 0.0006861991351095634, "rouge2_recall": 0.03867163671633521, "rouge2_recall_stderr": 0.0017747285897281744, "rougeL_fmeasure": 0.11854204244373989, "rougeL_fmeasure_stderr": 0.0014924813777114118, "rougeL_precision": 0.08378473061167403, "rougeL_precision_stderr": 0.0011056093599254957, "rougeL_recall": 0.21115579128906609, "rougeL_recall_stderr": 0.002637225983534165, "rougeLsum_fmeasure": 0.12557130842107206, "rougeLsum_fmeasure_stderr": 0.0016648364713290837, "rougeLsum_precision": 0.08877022608536633, "rougeLsum_precision_stderr": 0.0012265040039533249, "rougeLsum_recall": 0.22324911827513313, "rougeLsum_recall_stderr": 0.0029138573801630453}}, "3": {"article_DOC_summary": {"bleu": 0.7723989217062374, "bleu_stderr": 0.07506332455732345, "rouge1_fmeasure": 0.1459946014022398, "rouge1_fmeasure_stderr": 0.002181990692411414, "rouge1_precision": 0.10592564096937784, "rouge1_precision_stderr": 0.0017525879317443233, "rouge1_recall": 0.2539427012445784, "rouge1_recall_stderr": 0.003731447303357977, "rouge2_fmeasure": 0.020061440587479485, "rouge2_fmeasure_stderr": 0.0009777698919290968, "rouge2_precision": 0.01420534449614851, "rouge2_precision_stderr": 0.0007006470449943444, "rouge2_recall": 0.03590630051582267, "rouge2_recall_stderr": 0.0017733541653792099, "rougeL_fmeasure": 0.11265406503599139, "rougeL_fmeasure_stderr": 0.001630908636011174, "rougeL_precision": 0.08153731863940099, "rougeL_precision_stderr": 0.0012887659869021155, "rougeL_recall": 0.19693769942475764, "rougeL_recall_stderr": 0.002869678698254578, "rougeLsum_fmeasure": 0.11915978365542443, "rougeLsum_fmeasure_stderr": 0.0017414042260366922, "rougeLsum_precision": 0.08628916736533274, "rougeLsum_precision_stderr": 0.0013712543798638922, "rougeLsum_recall": 0.2081960052350543, "rougeLsum_recall_stderr": 0.0030602079181311892}}, "4": {"article_DOC_summary": {"bleu": 0.4202554532269484, "bleu_stderr": 0.12262307961277104, "rouge1_fmeasure": 0.040215681107462056, "rouge1_fmeasure_stderr": 0.002237517556474153, "rouge1_precision": 0.034471583104804415, "rouge1_precision_stderr": 0.002238315408267895, "rouge1_recall": 0.06381728541655798, "rouge1_recall_stderr": 0.0036282870714125083, "rouge2_fmeasure": 0.004935566104695442, "rouge2_fmeasure_stderr": 0.0005753566907154545, "rouge2_precision": 0.003871537312889549, "rouge2_precision_stderr": 0.0005719133532575095, "rouge2_recall": 0.008269838331766569, "rouge2_recall_stderr": 0.0009564670794954605, "rougeL_fmeasure": 0.030441951036000715, "rougeL_fmeasure_stderr": 0.0016864228566178527, "rougeL_precision": 0.026758973645767164, "rougeL_precision_stderr": 0.0018801400712648681, "rougeL_recall": 0.04838251241637687, "rougeL_recall_stderr": 0.0027529301388328257, "rougeLsum_fmeasure": 0.03296335745988539, "rougeLsum_fmeasure_stderr": 0.001842268360788242, "rougeLsum_precision": 0.028758380610237905, "rougeLsum_precision_stderr": 0.0019838383896546154, "rougeLsum_recall": 0.052394609604491466, "rougeLsum_recall_stderr": 0.00300800960671939}}, "5": {"article_DOC_summary": {"bleu": 1.2660127317243813e-38, "bleu_stderr": 3.8267567150622576e-33, "rouge1_fmeasure": 0.002135746093866511, "rouge1_fmeasure_stderr": 0.0005838656686162581, "rouge1_precision": 0.002427203615941276, "rouge1_precision_stderr": 0.0006831484429133202, "rouge1_recall": 0.0019840191933539033, "rouge1_recall_stderr": 0.0005303913662852268, "rouge2_fmeasure": 0.00030743447999977873, "rouge2_fmeasure_stderr": 0.00013023642706646356, "rouge2_precision": 0.0003678072143665929, "rouge2_precision_stderr": 0.00015846001855024936, "rouge2_recall": 0.0002682301974754805, "rouge2_recall_stderr": 0.0001131215031105469, "rougeL_fmeasure": 0.001686259301474979, "rougeL_fmeasure_stderr": 0.0004921843202278661, "rougeL_precision": 0.0019066685986482705, "rougeL_precision_stderr": 0.0005793006239621258, "rougeL_recall": 0.001578844696073063, "rougeL_recall_stderr": 0.00044617009211618964, "rougeLsum_fmeasure": 0.001735086296720847, "rougeLsum_fmeasure_stderr": 0.0004903196095708464, "rougeLsum_precision": 0.0019704357925048386, "rougeLsum_precision_stderr": 0.0005792873025022089, "rougeLsum_recall": 0.00161831401010321, "rougeLsum_recall_stderr": 0.0004437097896608957}}}} \ No newline at end of file diff --git a/4b284b1b9c4seed4/evaluation/generation/slim.4b284b1b9c4seed4_GEM-web_nlg_en_PALM_prompt_0.json b/4b284b1b9c4seed4/evaluation/generation/slim.4b284b1b9c4seed4_GEM-web_nlg_en_PALM_prompt_0.json new file mode 100644 index 0000000000000000000000000000000000000000..816dda6b1a2eb6afbdb01f604e6680c5c87d3a0e --- /dev/null +++ b/4b284b1b9c4seed4/evaluation/generation/slim.4b284b1b9c4seed4_GEM-web_nlg_en_PALM_prompt_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.26787629279095865, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.02421388470865588 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.053140729220499526, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.001447561888642144 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.2650539620149166, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.004611089062355459 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.07916714595011602, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0016165914559961 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.021704917896300822, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0009077529999546599 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.10624239698539174, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0029454877090427634 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.03206245161358705, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0009944025304645106 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.04859565080529351, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0013030805071960487 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.24447365028169235, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0042597620469032324 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.07256452976899888, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0014455163882477753 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.04911887572948648, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0013308973848181627 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.24529807807313986, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004231057274690599 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.07317950398891415, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0014738730467798152 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b1b9c4seed4/evaluation/generation/slim.4b284b1b9c4seed4_GEM-web_nlg_en_PALM_prompt_1.json b/4b284b1b9c4seed4/evaluation/generation/slim.4b284b1b9c4seed4_GEM-web_nlg_en_PALM_prompt_1.json new file mode 100644 index 0000000000000000000000000000000000000000..3dc46cce007e915a3e27290f0cbdd72a374f7b65 --- /dev/null +++ b/4b284b1b9c4seed4/evaluation/generation/slim.4b284b1b9c4seed4_GEM-web_nlg_en_PALM_prompt_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.27346154994880517, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.02188738307683954 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.047626171506349936, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0011352906867889128 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.26035399188160574, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.004602505397267029 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.07424112149389747, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0013991731147740165 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.01795733317688481, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0006207760872719163 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.10255465178172037, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0028918136354984434 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.028108438388606747, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0008209525600219419 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.04253166976477524, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0009520378507813956 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.23570739197296856, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004138563159116714 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.06664007036780817, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.001225946991287631 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.044154443741561675, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0010805238879022037 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.24018067638000298, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004203191799368478 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.06858259906736544, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.001295048790148881 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b1b9c4seed4/evaluation/generation/slim.4b284b1b9c4seed4_GEM-web_nlg_en_PALM_prompt_2.json b/4b284b1b9c4seed4/evaluation/generation/slim.4b284b1b9c4seed4_GEM-web_nlg_en_PALM_prompt_2.json new file mode 100644 index 0000000000000000000000000000000000000000..67f6facb9545da06c0312aa425efbae9a9c32432 --- /dev/null +++ b/4b284b1b9c4seed4/evaluation/generation/slim.4b284b1b9c4seed4_GEM-web_nlg_en_PALM_prompt_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.28354223508209625, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.02196438336730763 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.04907071394368477, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0011814228439300668 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.2717922146470884, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.004679127784588707 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.077057196050893, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.001405552196581262 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.01847026867964925, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0006271549211076853 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.10837787945721133, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.00292786577048572 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.029195418367829688, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0008404145834110129 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.043547243362200026, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0010632111900203151 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.24217304687370458, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0041386950242398935 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.0683478121462329, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.001219408641805486 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.04538438937137174, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0010999742522302452 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.2509319606971942, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004265166783401968 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.07117154749767428, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.001278540354605195 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b1b9c4seed4/evaluation/generation/slim.4b284b1b9c4seed4_GEM-web_nlg_en_PALM_prompt_3.json b/4b284b1b9c4seed4/evaluation/generation/slim.4b284b1b9c4seed4_GEM-web_nlg_en_PALM_prompt_3.json new file mode 100644 index 0000000000000000000000000000000000000000..61c5697876b907e6bb51c3f005e298234f44a80e --- /dev/null +++ b/4b284b1b9c4seed4/evaluation/generation/slim.4b284b1b9c4seed4_GEM-web_nlg_en_PALM_prompt_3.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.26231700778830913, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.01677381795342571 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.048773010954172226, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0010801404950998403 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.2723524322573744, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.004614644088480283 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.07701202526647727, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0013264916492560968 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.01830389408829641, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.000765761231033471 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.10724024189536346, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0029417688916459905 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.028476680174906326, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0007831062590315599 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.04285349136828219, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0009848666531091866 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.23931793383909106, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0039933449779696656 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.06751038060872314, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0011522535843318086 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.045262801919532414, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.001021866086917732 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.25210574997713586, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004210876653447827 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.0713319417621141, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0012205962369251139 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 3, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b1b9c4seed4/evaluation/generation/slim.4b284b1b9c4seed4_GEM-web_nlg_en_PALM_prompt_4.json b/4b284b1b9c4seed4/evaluation/generation/slim.4b284b1b9c4seed4_GEM-web_nlg_en_PALM_prompt_4.json new file mode 100644 index 0000000000000000000000000000000000000000..41b972aae9d5300866021636f1f4f4220a0124ea --- /dev/null +++ b/4b284b1b9c4seed4/evaluation/generation/slim.4b284b1b9c4seed4_GEM-web_nlg_en_PALM_prompt_4.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.2909737297069181, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.016893325417647067 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.05081036279065346, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.001340290442932179 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.27689930067824825, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.004592552339097503 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.07880513839875916, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0013577530127801877 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.02000297688991883, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0009665376160012339 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.1098959472411629, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0029265187187869925 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.029911000513183756, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0008104665489277981 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.04469978216410197, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.001228415770141008 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.24325022171643784, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.003959401381097609 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.06910981407367636, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.001165837956941959 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.047479319186822515, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0012835127261851631 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.25785008091098, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004217817751472416 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.07342750134261251, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0012548900975791317 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 4, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b1b9c4seed4/evaluation/generation/slim.4b284b1b9c4seed4_GEM-web_nlg_en_PALM_prompt_5.json b/4b284b1b9c4seed4/evaluation/generation/slim.4b284b1b9c4seed4_GEM-web_nlg_en_PALM_prompt_5.json new file mode 100644 index 0000000000000000000000000000000000000000..c90ad612881326708ef39fd1523af25dea28f344 --- /dev/null +++ b/4b284b1b9c4seed4/evaluation/generation/slim.4b284b1b9c4seed4_GEM-web_nlg_en_PALM_prompt_5.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.275592913998383, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.010675634701516879 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.050188036684923054, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0010589097851446405 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.28261873177986385, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.004706167216581722 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.07936270839708998, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0013461361721732127 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.018414057787839, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0005667544666951426 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.11149049346375932, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.002957507274568516 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.029335540062254653, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.00077573226541773 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.04348160210158506, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0009025307067376957 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.2468060892224703, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004013696328255729 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.06878175079936166, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0011305052098162837 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.046368846883703685, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0009967098378676012 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.25991163700009623, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0042359736213800495 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.07315850261422062, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0012299656434355821 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 5, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b1b9c4seed4/evaluation/generation/slim.4b284b1b9c4seed4_GEM-wiki_lingua_en_tldr_en_0.json b/4b284b1b9c4seed4/evaluation/generation/slim.4b284b1b9c4seed4_GEM-wiki_lingua_en_tldr_en_0.json new file mode 100644 index 0000000000000000000000000000000000000000..4f8edb4da64bf491a49060a3e16efd85f82cac04 --- /dev/null +++ b/4b284b1b9c4seed4/evaluation/generation/slim.4b284b1b9c4seed4_GEM-wiki_lingua_en_tldr_en_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.1508638357497856, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0019477340479700028 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.24849466528414227, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0025701642988402284 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.17351939045996323, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0018292808999788056 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.028565167813151382, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0007213658899061881 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.04860070927724722, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0012792940293872988 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.033112770233475294, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0007842583345225733 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.11205417400994366, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.001364543594879335 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.19083146969499562, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0020249121235725457 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.1300215852768387, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0012668686976567704 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.14039987541721508, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.001794428495675629 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.23240706811113432, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.002406095416292502 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.16176041579500514, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0016905736140852296 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 1.4498797804800554, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.030033155430787307 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b1b9c4seed4/evaluation/generation/slim.4b284b1b9c4seed4_GEM-wiki_lingua_en_tldr_en_1.json b/4b284b1b9c4seed4/evaluation/generation/slim.4b284b1b9c4seed4_GEM-wiki_lingua_en_tldr_en_1.json new file mode 100644 index 0000000000000000000000000000000000000000..131449da31df071e28ec372947d7def2e67fd353 --- /dev/null +++ b/4b284b1b9c4seed4/evaluation/generation/slim.4b284b1b9c4seed4_GEM-wiki_lingua_en_tldr_en_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.1526735082069478, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.001954192368311485 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.2537630901501927, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0025247263534353263 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.17598744290815144, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.001808190292239866 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.02844271878006758, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0007501808391968073 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.048050899811526195, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0013077335984725508 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.032548106421086444, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0007854290741659407 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.11085969871259992, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0013092492625755249 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.1910548183701386, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0019406911815812453 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.1291623611792601, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0012144030507005796 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.14352989085571205, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0018308845070724087 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.23982592472606548, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0024037588777864357 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.1656292822984552, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0016884673231307584 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 1.5523030824089203, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.0404745781112937 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b1b9c4seed4/evaluation/generation/slim.4b284b1b9c4seed4_GEM-wiki_lingua_en_tldr_en_2.json b/4b284b1b9c4seed4/evaluation/generation/slim.4b284b1b9c4seed4_GEM-wiki_lingua_en_tldr_en_2.json new file mode 100644 index 0000000000000000000000000000000000000000..d85ccad272099f8f8e328df25c86df83ce7f5236 --- /dev/null +++ b/4b284b1b9c4seed4/evaluation/generation/slim.4b284b1b9c4seed4_GEM-wiki_lingua_en_tldr_en_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.15614318865894197, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.001953522003890445 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.2564233598947695, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.002443975404517576 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.17851912473986262, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0017588268154772792 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.028786254184172754, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0007381734830468564 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.04721098878117776, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0012484536682449941 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.032531974500306655, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0007707378614567543 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.11436547586059817, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0013634627836511027 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.19403348190827804, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.001915506475404068 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.13175959208331914, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.00119267469976916 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.14706172179649213, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0018475712783318878 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.24190155350034248, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0023184025713278256 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.16809587331436024, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.001653116049291498 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 1.5504469719150438, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.046981957687555205 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b1b9c4seed4/evaluation/generation/slim.4b284b1b9c4seed4_GEM-wiki_lingua_en_tldr_en_3.json b/4b284b1b9c4seed4/evaluation/generation/slim.4b284b1b9c4seed4_GEM-wiki_lingua_en_tldr_en_3.json new file mode 100644 index 0000000000000000000000000000000000000000..259f0fa96aaee030bec8fe5afe27ba76d4aa243c --- /dev/null +++ b/4b284b1b9c4seed4/evaluation/generation/slim.4b284b1b9c4seed4_GEM-wiki_lingua_en_tldr_en_3.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.13699405852667912, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0022271962965683227 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.21313164031151458, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0028175993079765913 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.14977645750144936, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.00199726722683507 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.025286085868956577, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0007388515719204758 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.04046828319806029, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.001196737089891652 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.027873427098971903, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0007427085100927844 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.10087113357194523, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0016060316815470442 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.1621097484851492, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0021946464603937125 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.11096435645199118, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0014009503741229052 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.1288247035213342, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0020910254870389346 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.2007771126062864, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0026617775847568633 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.1408419182005074, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0018690086358082113 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 1.6506772563162972, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.07202666343435976 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 3, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b1b9c4seed4/evaluation/generation/slim.4b284b1b9c4seed4_GEM-wiki_lingua_en_tldr_en_4.json b/4b284b1b9c4seed4/evaluation/generation/slim.4b284b1b9c4seed4_GEM-wiki_lingua_en_tldr_en_4.json new file mode 100644 index 0000000000000000000000000000000000000000..385a4f2a38f59321c044a3892b88617cb7e0106c --- /dev/null +++ b/4b284b1b9c4seed4/evaluation/generation/slim.4b284b1b9c4seed4_GEM-wiki_lingua_en_tldr_en_4.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.04727049455418174, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0018100262381206956 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.07308789496556233, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.002548253609808092 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.04990479829313592, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0017225289026089794 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.009152769715333476, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0005809882470945591 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.014793686682183805, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0008871836496692909 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.009704784607524384, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0005246010118344956 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.03634445955852837, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0014097418513319498 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.05712304517098294, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.002020929141181275 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.038102997687537214, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0012904657107170763 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.04450904725651575, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0017072089167818546 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.06907832245228929, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.002416204133617309 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.04692854753900321, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.001615455808763454 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 0.35442363598057186, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.02957890609663373 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 4, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b1b9c4seed4/evaluation/generation/slim.4b284b1b9c4seed4_GEM-wiki_lingua_en_tldr_en_5.json b/4b284b1b9c4seed4/evaluation/generation/slim.4b284b1b9c4seed4_GEM-wiki_lingua_en_tldr_en_5.json new file mode 100644 index 0000000000000000000000000000000000000000..36a4b743b13bcf2d13fe3d33af55680b5d50822e --- /dev/null +++ b/4b284b1b9c4seed4/evaluation/generation/slim.4b284b1b9c4seed4_GEM-wiki_lingua_en_tldr_en_5.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.007806943563100253, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0008029596223294583 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.011916878778381854, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0011710685254217557 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.007934022472178462, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0007646898711388704 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.0015499616053509758, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.00024432717225911417 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.0022995865319653413, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.00033582149369530104 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.0014852201283601309, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.00020361223200698468 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.006059612662075617, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0006187644415825575 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.009361683565350928, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0009310373409583372 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.006092063289579814, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0005734478033484189 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.0073509618326022316, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0007548623257902688 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.011247516251388902, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.001102260125459754 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.007474906777946338, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0007195818405089297 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 2.3773909381181067e-07, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 6.777702484631335e-07 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 5, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b1b9c4seed4/evaluation/generation/slim.4b284b1b9c4seed4_e2e_nlg_cleaned_generate_text_restaurant_0.json b/4b284b1b9c4seed4/evaluation/generation/slim.4b284b1b9c4seed4_e2e_nlg_cleaned_generate_text_restaurant_0.json new file mode 100644 index 0000000000000000000000000000000000000000..97f1ca2eeb46fc366486a0e31ee7764f26809cc8 --- /dev/null +++ b/4b284b1b9c4seed4/evaluation/generation/slim.4b284b1b9c4seed4_e2e_nlg_cleaned_generate_text_restaurant_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 0.8482338536273092, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.06579534941253831 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.03689992434617125, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.00143080390296388 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.03176166527004807, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.0015278801549138494 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.029524410502349083, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.0012194408459950685 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.005295864917355121, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.000436477995087522 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.008570227243564495, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.0006945659775254231 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.006282252522560226, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0005083233271996686 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.034035125364177875, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.0013033143404442467 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.02894660702654024, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.0013685312959876327 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.02704266874243934, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.001092799039388727 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.034329573061074765, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.0013151068156701008 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.028756511365956524, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.0013753740219635173 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.027093010874833397, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0011035568012963972 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b1b9c4seed4/evaluation/generation/slim.4b284b1b9c4seed4_e2e_nlg_cleaned_generate_text_restaurant_1.json b/4b284b1b9c4seed4/evaluation/generation/slim.4b284b1b9c4seed4_e2e_nlg_cleaned_generate_text_restaurant_1.json new file mode 100644 index 0000000000000000000000000000000000000000..eb776e610e25289a08779bc4a855fe7db42f8754 --- /dev/null +++ b/4b284b1b9c4seed4/evaluation/generation/slim.4b284b1b9c4seed4_e2e_nlg_cleaned_generate_text_restaurant_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 5.942260098167613, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.09441092756090216 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.3146822903840917, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.0026228566349168303 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.4073067647472486, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.002694916559116025 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.3304930105126096, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.0020464079472463886 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.11973672411480318, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0017049415225723842 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.15858199335292084, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.001880021556117094 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.12621157789802925, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.00144122341707661 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.23121444753390857, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.0019617352937841724 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.30603012289790815, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.002249710012043417 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.24390496755077615, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0014758735639314516 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.26253682646143983, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.0023660383137224746 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.33971109353202855, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.002493554468070354 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.27519248986257294, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0018786355388105225 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b1b9c4seed4/evaluation/generation/slim.4b284b1b9c4seed4_e2e_nlg_cleaned_generate_text_restaurant_2.json b/4b284b1b9c4seed4/evaluation/generation/slim.4b284b1b9c4seed4_e2e_nlg_cleaned_generate_text_restaurant_2.json new file mode 100644 index 0000000000000000000000000000000000000000..c636af57e340a4f35eeb011026bec4e698845c48 --- /dev/null +++ b/4b284b1b9c4seed4/evaluation/generation/slim.4b284b1b9c4seed4_e2e_nlg_cleaned_generate_text_restaurant_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 6.725052864934353, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.14629714654304157 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.3370432420794776, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.0029582437787025427 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.41475409018206294, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.002581973755669344 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.3455500221300751, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.0020567847742166303 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.13924246863995587, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0018935171496830272 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.17241918013486687, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.0019222974911274624 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.14215332459928473, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0015526430769182552 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.25285247263136995, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.002281200773310861 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.31635151085258584, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.002181518712740274 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.26044817619281624, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0015920982446906947 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.28533453436961675, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.0026174427606121924 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.35223597019269687, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.002458693422243018 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.29316637284801744, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0019474180340165936 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b1b9c4seed4/evaluation/generation/slim.4b284b1b9c4seed4_e2e_nlg_cleaned_generate_text_restaurant_3.json b/4b284b1b9c4seed4/evaluation/generation/slim.4b284b1b9c4seed4_e2e_nlg_cleaned_generate_text_restaurant_3.json new file mode 100644 index 0000000000000000000000000000000000000000..ef7f09978dc3496e0316c39e7348082c08ca18a4 --- /dev/null +++ b/4b284b1b9c4seed4/evaluation/generation/slim.4b284b1b9c4seed4_e2e_nlg_cleaned_generate_text_restaurant_3.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 6.973175823947467, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.08432471729881086 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.3372869158678504, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.002968659112264888 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.41917585622339343, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.0024657865682947604 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.3491442563303595, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.002084406661790611 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.1451623356626606, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.001878882685675287 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.1805945511839357, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.001899662372461791 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.14925241670212142, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0015639781562393712 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.25377095839457386, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.0023013165756289485 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.31994498910057845, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.0020988836643955253 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.2637903997625913, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0016349236936735077 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.2861590985165946, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.0026614220152062383 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.35633299447456107, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.00237175789815616 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.29641103594998963, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0019700089086597617 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 3, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b1b9c4seed4/evaluation/generation/slim.4b284b1b9c4seed4_e2e_nlg_cleaned_generate_text_restaurant_4.json b/4b284b1b9c4seed4/evaluation/generation/slim.4b284b1b9c4seed4_e2e_nlg_cleaned_generate_text_restaurant_4.json new file mode 100644 index 0000000000000000000000000000000000000000..a35d77278fb0156fc8a3af43583941ab951af684 --- /dev/null +++ b/4b284b1b9c4seed4/evaluation/generation/slim.4b284b1b9c4seed4_e2e_nlg_cleaned_generate_text_restaurant_4.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 6.781202241557229, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.11394876149110739 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.3287498306441592, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.002864037922185099 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.4242438979853323, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.002418778880597351 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.34660270706267965, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.002015167448860447 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.14188074782669924, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0018111547132663394 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.18330145095889133, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.001867227120259638 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.1484646710112249, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0015009486601977229 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.24760447580397063, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.002205771870408524 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.3245629843061881, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.002091486936788564 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.2623953647532703, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0015873390211834876 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.2799336817988539, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.0025898070057799047 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.36159803652552097, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.002354029382709626 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.2952178835224044, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0019315028392222534 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 4, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b1b9c4seed4/evaluation/generation/slim.4b284b1b9c4seed4_e2e_nlg_cleaned_generate_text_restaurant_5.json b/4b284b1b9c4seed4/evaluation/generation/slim.4b284b1b9c4seed4_e2e_nlg_cleaned_generate_text_restaurant_5.json new file mode 100644 index 0000000000000000000000000000000000000000..b3e7b9f79d009a85009064fb5b8bd0299e21c1cd --- /dev/null +++ b/4b284b1b9c4seed4/evaluation/generation/slim.4b284b1b9c4seed4_e2e_nlg_cleaned_generate_text_restaurant_5.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 6.685901964010736, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.1354495963808724 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.32176357670299083, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.0027967903182063224 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.4272486932644093, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.0023809505635255927 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.3437737218331649, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.0019546229382639466 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.13815978485481578, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0017518294091340995 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.18494316023841778, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.0018444532176795417 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.14683833434343727, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0014540710021065215 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.2417191397949724, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.00214960916866614 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.32601659789964693, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.0020925727851936926 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.2596864980022702, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0015675414220731314 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.27513062879919625, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.0025215646737994962 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.3659104174188377, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.0023445078388895997 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.29423382905586287, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0018901601807881775 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 5, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b1b9c4seed4/evaluation/generation/slim.4b284b1b9c4seed4_gem_xsum_article_DOC_summary_0.json b/4b284b1b9c4seed4/evaluation/generation/slim.4b284b1b9c4seed4_gem_xsum_article_DOC_summary_0.json new file mode 100644 index 0000000000000000000000000000000000000000..558edabb684c8eac1f6376606b3512ae63a809a2 --- /dev/null +++ b/4b284b1b9c4seed4/evaluation/generation/slim.4b284b1b9c4seed4_gem_xsum_article_DOC_summary_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.14337493474921045, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.0018970632275809294 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.32850970396744716, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.0039197450040575135 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.19381060522505453, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.0022326458513688033 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.027496214834546444, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.001054159884756719 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.06556453127883762, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.0023771544908032247 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.03756311678020454, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.001356763612763011 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.10679400111516424, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0014304369917064012 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.2459644623091805, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.002986298895539128 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.14442948981860032, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0016582345165837742 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.11360184621025315, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0015482924171113445 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.26296431121251945, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.003409100925773213 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.15408798170242552, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0018796051363025486 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 1.445573424695658, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.15425934770761948 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b1b9c4seed4/evaluation/generation/slim.4b284b1b9c4seed4_gem_xsum_article_DOC_summary_1.json b/4b284b1b9c4seed4/evaluation/generation/slim.4b284b1b9c4seed4_gem_xsum_article_DOC_summary_1.json new file mode 100644 index 0000000000000000000000000000000000000000..f54e787f26891e6a98c8df781c72e3dfce051c7b --- /dev/null +++ b/4b284b1b9c4seed4/evaluation/generation/slim.4b284b1b9c4seed4_gem_xsum_article_DOC_summary_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.10765659328853563, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.0015212603420465503 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.2657263624255442, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.0033066001915549596 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.1513724503049335, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.0020050978617654432 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.013942450754043968, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0006842372730185846 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.03481401056485645, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.0016493879352824244 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.01966067423050901, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0009461105744381743 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.08261246482339596, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0011168888732104218 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.20552675444508914, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.0025401789847852084 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.11639992980160706, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0014853662011968952 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.08719479126054427, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0012099004109665159 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.21714465186994203, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.0027534050196141966 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.12287565931519653, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0016075317103237032 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 0.6954014401170389, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.0939232317796097 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b1b9c4seed4/evaluation/generation/slim.4b284b1b9c4seed4_gem_xsum_article_DOC_summary_2.json b/4b284b1b9c4seed4/evaluation/generation/slim.4b284b1b9c4seed4_gem_xsum_article_DOC_summary_2.json new file mode 100644 index 0000000000000000000000000000000000000000..a493df44349834ee4d661b528565db21b6cd894d --- /dev/null +++ b/4b284b1b9c4seed4/evaluation/generation/slim.4b284b1b9c4seed4_gem_xsum_article_DOC_summary_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.10867457736153135, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.001495555344909094 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.27143929169611797, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.003394856674159156 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.15344534516159183, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.0020053949533959292 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.01507662196122561, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0006861991351095634 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.03867163671633521, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.0017747285897281744 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.02144461765365429, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0009703360723919554 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.08378473061167403, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0011056093599254957 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.21115579128906609, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.002637225983534165 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.11854204244373989, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0014924813777114118 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.08877022608536633, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0012265040039533249 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.22324911827513313, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.0029138573801630453 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.12557130842107206, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0016648364713290837 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 0.7307303414586408, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.06155547874417727 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b1b9c4seed4/evaluation/generation/slim.4b284b1b9c4seed4_gem_xsum_article_DOC_summary_3.json b/4b284b1b9c4seed4/evaluation/generation/slim.4b284b1b9c4seed4_gem_xsum_article_DOC_summary_3.json new file mode 100644 index 0000000000000000000000000000000000000000..74c7fee769eb6dada3fee0432246f0354267e990 --- /dev/null +++ b/4b284b1b9c4seed4/evaluation/generation/slim.4b284b1b9c4seed4_gem_xsum_article_DOC_summary_3.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.10592564096937784, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.0017525879317443233 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.2539427012445784, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.003731447303357977 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.1459946014022398, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.002181990692411414 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.01420534449614851, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0007006470449943444 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.03590630051582267, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.0017733541653792099 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.020061440587479485, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0009777698919290968 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.08153731863940099, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0012887659869021155 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.19693769942475764, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.002869678698254578 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.11265406503599139, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.001630908636011174 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.08628916736533274, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0013712543798638922 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.2081960052350543, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.0030602079181311892 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.11915978365542443, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0017414042260366922 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 0.7723989217062374, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.07506332455732345 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 3, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b1b9c4seed4/evaluation/generation/slim.4b284b1b9c4seed4_gem_xsum_article_DOC_summary_4.json b/4b284b1b9c4seed4/evaluation/generation/slim.4b284b1b9c4seed4_gem_xsum_article_DOC_summary_4.json new file mode 100644 index 0000000000000000000000000000000000000000..b791e0412e4724b51e341158f871482e770d837a --- /dev/null +++ b/4b284b1b9c4seed4/evaluation/generation/slim.4b284b1b9c4seed4_gem_xsum_article_DOC_summary_4.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.034471583104804415, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.002238315408267895 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.06381728541655798, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.0036282870714125083 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.040215681107462056, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.002237517556474153 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.003871537312889549, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0005719133532575095 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.008269838331766569, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.0009564670794954605 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.004935566104695442, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0005753566907154545 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.026758973645767164, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0018801400712648681 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.04838251241637687, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.0027529301388328257 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.030441951036000715, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0016864228566178527 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.028758380610237905, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0019838383896546154 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.052394609604491466, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.00300800960671939 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.03296335745988539, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.001842268360788242 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 0.4202554532269484, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.12262307961277104 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 4, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b1b9c4seed4/evaluation/generation/slim.4b284b1b9c4seed4_gem_xsum_article_DOC_summary_5.json b/4b284b1b9c4seed4/evaluation/generation/slim.4b284b1b9c4seed4_gem_xsum_article_DOC_summary_5.json new file mode 100644 index 0000000000000000000000000000000000000000..b58218b1b4012f908fb7c2ff103153806db3a9ca --- /dev/null +++ b/4b284b1b9c4seed4/evaluation/generation/slim.4b284b1b9c4seed4_gem_xsum_article_DOC_summary_5.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.002427203615941276, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.0006831484429133202 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.0019840191933539033, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.0005303913662852268 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.002135746093866511, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.0005838656686162581 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.0003678072143665929, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.00015846001855024936 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.0002682301974754805, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.0001131215031105469 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.00030743447999977873, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.00013023642706646356 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.0019066685986482705, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0005793006239621258 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.001578844696073063, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.00044617009211618964 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.001686259301474979, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0004921843202278661 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.0019704357925048386, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0005792873025022089 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.00161831401010321, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.0004437097896608957 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.001735086296720847, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0004903196095708464 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 1.2660127317243813e-38, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 3.8267567150622576e-33 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b1b9c4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 5, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b1b9c4seed4/evaluation/rankeval/4b284b1b9c4seed4_0.csv b/4b284b1b9c4seed4/evaluation/rankeval/4b284b1b9c4seed4_0.csv new file mode 100644 index 0000000000000000000000000000000000000000..e0df603a87c36e3d00605a78d7cb31b3bac9a7b3 --- /dev/null +++ b/4b284b1b9c4seed4/evaluation/rankeval/4b284b1b9c4seed4_0.csv @@ -0,0 +1,21 @@ +task,metric,value,err,version +anli_r1,acc,0.318,0.014734079309311901,0 +anli_r2,acc,0.316,0.014709193056057111,0 +anli_r3,acc,0.33416666666666667,0.013622434813136785,0 +arc_challenge,acc,0.2380546075085324,0.012445770028026208,0 +arc_challenge,acc_norm,0.2508532423208191,0.012668198621315432,0 +arc_easy,acc,0.4852693602693603,0.010255329977562098,0 +arc_easy,acc_norm,0.45075757575757575,0.010209906101011116,0 +boolq,acc,0.4666666666666667,0.008725599880049204,1 +cb,acc,0.25,0.058387420812114225,1 +cb,f1,0.18062893081761008,,1 +copa,acc,0.72,0.04512608598542127,0 +hellaswag,acc,0.39533957379008167,0.0048792428484734605,0 +hellaswag,acc_norm,0.49571798446524595,0.004989598426249536,0 +piqa,acc,0.70620239390642,0.010627574080514802,0 +piqa,acc_norm,0.7034820457018498,0.010656078922661133,0 +rte,acc,0.51985559566787,0.030072723167317177,0 +sciq,acc,0.727,0.014095022868717581,0 +sciq,acc_norm,0.654,0.015050266127564448,0 +storycloze_2016,acc,0.6659540352752539,0.010906978048365164,0 +winogrande,acc,0.5327545382794001,0.014022300570434132,0 diff --git a/4b284b1b9c4seed4/evaluation/rankeval/4b284b1b9c4seed4_0.json b/4b284b1b9c4seed4/evaluation/rankeval/4b284b1b9c4seed4_0.json new file mode 100644 index 0000000000000000000000000000000000000000..5e038b2c4d8cbba0c0c9863d471d7c2a9ec94c86 --- /dev/null +++ b/4b284b1b9c4seed4/evaluation/rankeval/4b284b1b9c4seed4_0.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.318, + "acc_stderr": 0.014734079309311901 + }, + "anli_r2": { + "acc": 0.316, + "acc_stderr": 0.014709193056057111 + }, + "anli_r3": { + "acc": 0.33416666666666667, + "acc_stderr": 0.013622434813136785 + }, + "cb": { + "acc": 0.25, + "acc_stderr": 0.058387420812114225, + "f1": 0.18062893081761008 + }, + "copa": { + "acc": 0.72, + "acc_stderr": 0.04512608598542127 + }, + "hellaswag": { + "acc": 0.39533957379008167, + "acc_stderr": 0.0048792428484734605, + "acc_norm": 0.49571798446524595, + "acc_norm_stderr": 0.004989598426249536 + }, + "rte": { + "acc": 0.51985559566787, + "acc_stderr": 0.030072723167317177 + }, + "winogrande": { + "acc": 0.5327545382794001, + "acc_stderr": 0.014022300570434132 + }, + "storycloze_2016": { + "acc": 0.6659540352752539, + "acc_stderr": 0.010906978048365164 + }, + "boolq": { + "acc": 0.4666666666666667, + "acc_stderr": 0.008725599880049204 + }, + "arc_easy": { + "acc": 0.4852693602693603, + "acc_stderr": 0.010255329977562098, + "acc_norm": 0.45075757575757575, + "acc_norm_stderr": 0.010209906101011116 + }, + "arc_challenge": { + "acc": 0.2380546075085324, + "acc_stderr": 0.012445770028026208, + "acc_norm": 0.2508532423208191, + "acc_norm_stderr": 0.012668198621315432 + }, + "sciq": { + "acc": 0.727, + "acc_stderr": 0.014095022868717581, + "acc_norm": 0.654, + "acc_norm_stderr": 0.015050266127564448 + }, + "piqa": { + "acc": 0.70620239390642, + "acc_stderr": 0.010627574080514802, + "acc_norm": 0.7034820457018498, + "acc_norm_stderr": 0.010656078922661133 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b1b9c4seed4/evaluation/rankeval/4b284b1b9c4seed4_1.csv b/4b284b1b9c4seed4/evaluation/rankeval/4b284b1b9c4seed4_1.csv new file mode 100644 index 0000000000000000000000000000000000000000..e684882644fdd6b96bfb26eba1f4e2aef5f5a971 --- /dev/null +++ b/4b284b1b9c4seed4/evaluation/rankeval/4b284b1b9c4seed4_1.csv @@ -0,0 +1,21 @@ +task,metric,value,err,version +anli_r1,acc,0.332,0.014899597242811483,0 +anli_r2,acc,0.344,0.015029633724408947,0 +anli_r3,acc,0.3375,0.013655897185463653,0 +arc_challenge,acc,0.22184300341296928,0.012141659068147884,0 +arc_challenge,acc_norm,0.23720136518771331,0.01243039982926085,0 +arc_easy,acc,0.4663299663299663,0.010236494647406476,0 +arc_easy,acc_norm,0.4591750841750842,0.010225526906982606,0 +boolq,acc,0.43730886850152906,0.008676043429497427,1 +cb,acc,0.4107142857142857,0.0663363415035954,1 +cb,f1,0.285919540229885,,1 +copa,acc,0.68,0.04688261722621505,0 +hellaswag,acc,0.39912368054172476,0.004887174080003037,0 +hellaswag,acc_norm,0.4940250946026688,0.0049894251333779055,0 +piqa,acc,0.6996735582154516,0.010695225308183138,0 +piqa,acc_norm,0.7018498367791077,0.01067296411400829,0 +rte,acc,0.48014440433212996,0.0300727231673172,0 +sciq,acc,0.737,0.013929286594259741,0 +sciq,acc_norm,0.679,0.014770821817934649,0 +storycloze_2016,acc,0.6451095670764297,0.011064787659904119,0 +winogrande,acc,0.526440410418311,0.01403282387440722,0 diff --git a/4b284b1b9c4seed4/evaluation/rankeval/4b284b1b9c4seed4_1.json b/4b284b1b9c4seed4/evaluation/rankeval/4b284b1b9c4seed4_1.json new file mode 100644 index 0000000000000000000000000000000000000000..c19232dbb0dd3f3954486ae6ba2cdbbac672b02f --- /dev/null +++ b/4b284b1b9c4seed4/evaluation/rankeval/4b284b1b9c4seed4_1.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.332, + "acc_stderr": 0.014899597242811483 + }, + "anli_r2": { + "acc": 0.344, + "acc_stderr": 0.015029633724408947 + }, + "anli_r3": { + "acc": 0.3375, + "acc_stderr": 0.013655897185463653 + }, + "cb": { + "acc": 0.4107142857142857, + "acc_stderr": 0.0663363415035954, + "f1": 0.285919540229885 + }, + "copa": { + "acc": 0.68, + "acc_stderr": 0.04688261722621505 + }, + "hellaswag": { + "acc": 0.39912368054172476, + "acc_stderr": 0.004887174080003037, + "acc_norm": 0.4940250946026688, + "acc_norm_stderr": 0.0049894251333779055 + }, + "rte": { + "acc": 0.48014440433212996, + "acc_stderr": 0.0300727231673172 + }, + "winogrande": { + "acc": 0.526440410418311, + "acc_stderr": 0.01403282387440722 + }, + "storycloze_2016": { + "acc": 0.6451095670764297, + "acc_stderr": 0.011064787659904119 + }, + "boolq": { + "acc": 0.43730886850152906, + "acc_stderr": 0.008676043429497427 + }, + "arc_easy": { + "acc": 0.4663299663299663, + "acc_stderr": 0.010236494647406476, + "acc_norm": 0.4591750841750842, + "acc_norm_stderr": 0.010225526906982606 + }, + "arc_challenge": { + "acc": 0.22184300341296928, + "acc_stderr": 0.012141659068147884, + "acc_norm": 0.23720136518771331, + "acc_norm_stderr": 0.01243039982926085 + }, + "sciq": { + "acc": 0.737, + "acc_stderr": 0.013929286594259741, + "acc_norm": 0.679, + "acc_norm_stderr": 0.014770821817934649 + }, + "piqa": { + "acc": 0.6996735582154516, + "acc_stderr": 0.010695225308183138, + "acc_norm": 0.7018498367791077, + "acc_norm_stderr": 0.01067296411400829 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b1b9c4seed4/evaluation/rankeval/4b284b1b9c4seed4_2.csv b/4b284b1b9c4seed4/evaluation/rankeval/4b284b1b9c4seed4_2.csv new file mode 100644 index 0000000000000000000000000000000000000000..2804c253e93af9648b1fa0cd8ec679c063b52d86 --- /dev/null +++ b/4b284b1b9c4seed4/evaluation/rankeval/4b284b1b9c4seed4_2.csv @@ -0,0 +1,21 @@ +task,metric,value,err,version +anli_r1,acc,0.319,0.01474640486547348,0 +anli_r2,acc,0.35,0.015090650341444231,0 +anli_r3,acc,0.3258333333333333,0.013535422043417455,0 +arc_challenge,acc,0.22184300341296928,0.012141659068147884,0 +arc_challenge,acc_norm,0.25853242320819114,0.012794553754288684,0 +arc_easy,acc,0.4781144781144781,0.010249950427234155,0 +arc_easy,acc_norm,0.46254208754208753,0.010230952104570805,0 +boolq,acc,0.4437308868501529,0.008689501105367406,1 +cb,acc,0.4107142857142857,0.06633634150359541,1 +cb,f1,0.2796474358974359,,1 +copa,acc,0.65,0.047937248544110196,0 +hellaswag,acc,0.3988249352718582,0.0048865590087549884,0 +hellaswag,acc_norm,0.4953196574387572,0.004989562798280527,0 +piqa,acc,0.6953210010881393,0.010738889044325161,0 +piqa,acc_norm,0.7018498367791077,0.010672964114008301,0 +rte,acc,0.5270758122743683,0.030052303463143706,0 +sciq,acc,0.754,0.013626065817750641,0 +sciq,acc_norm,0.714,0.014297146862517908,0 +storycloze_2016,acc,0.6509887760555852,0.011022640519108546,0 +winogrande,acc,0.5185477505919495,0.014042813708888378,0 diff --git a/4b284b1b9c4seed4/evaluation/rankeval/4b284b1b9c4seed4_2.json b/4b284b1b9c4seed4/evaluation/rankeval/4b284b1b9c4seed4_2.json new file mode 100644 index 0000000000000000000000000000000000000000..2d7e461b7a817f68c80b50605102d984d59fe622 --- /dev/null +++ b/4b284b1b9c4seed4/evaluation/rankeval/4b284b1b9c4seed4_2.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.319, + "acc_stderr": 0.01474640486547348 + }, + "anli_r2": { + "acc": 0.35, + "acc_stderr": 0.015090650341444231 + }, + "anli_r3": { + "acc": 0.3258333333333333, + "acc_stderr": 0.013535422043417455 + }, + "cb": { + "acc": 0.4107142857142857, + "acc_stderr": 0.06633634150359541, + "f1": 0.2796474358974359 + }, + "copa": { + "acc": 0.65, + "acc_stderr": 0.047937248544110196 + }, + "hellaswag": { + "acc": 0.3988249352718582, + "acc_stderr": 0.0048865590087549884, + "acc_norm": 0.4953196574387572, + "acc_norm_stderr": 0.004989562798280527 + }, + "rte": { + "acc": 0.5270758122743683, + "acc_stderr": 0.030052303463143706 + }, + "winogrande": { + "acc": 0.5185477505919495, + "acc_stderr": 0.014042813708888378 + }, + "storycloze_2016": { + "acc": 0.6509887760555852, + "acc_stderr": 0.011022640519108546 + }, + "boolq": { + "acc": 0.4437308868501529, + "acc_stderr": 0.008689501105367406 + }, + "arc_easy": { + "acc": 0.4781144781144781, + "acc_stderr": 0.010249950427234155, + "acc_norm": 0.46254208754208753, + "acc_norm_stderr": 0.010230952104570805 + }, + "arc_challenge": { + "acc": 0.22184300341296928, + "acc_stderr": 0.012141659068147884, + "acc_norm": 0.25853242320819114, + "acc_norm_stderr": 0.012794553754288684 + }, + "sciq": { + "acc": 0.754, + "acc_stderr": 0.013626065817750641, + "acc_norm": 0.714, + "acc_norm_stderr": 0.014297146862517908 + }, + "piqa": { + "acc": 0.6953210010881393, + "acc_stderr": 0.010738889044325161, + "acc_norm": 0.7018498367791077, + "acc_norm_stderr": 0.010672964114008301 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b1b9c4seed4/evaluation/rankeval/4b284b1b9c4seed4_3.csv b/4b284b1b9c4seed4/evaluation/rankeval/4b284b1b9c4seed4_3.csv new file mode 100644 index 0000000000000000000000000000000000000000..101098f504ffd6fb0bc711b4f075f026369220ed --- /dev/null +++ b/4b284b1b9c4seed4/evaluation/rankeval/4b284b1b9c4seed4_3.csv @@ -0,0 +1,21 @@ +task,metric,value,err,version +anli_r1,acc,0.334,0.014922019523732961,0 +anli_r2,acc,0.36,0.015186527932040126,0 +anli_r3,acc,0.3475,0.013751753243291854,0 +arc_challenge,acc,0.23208191126279865,0.012336718284948854,0 +arc_challenge,acc_norm,0.25597269624573377,0.012753013241244514,0 +arc_easy,acc,0.4877946127946128,0.010256726235129018,0 +arc_easy,acc_norm,0.46085858585858586,0.010228298200766124,0 +boolq,acc,0.4529051987767584,0.008706176885837736,1 +cb,acc,0.39285714285714285,0.0658538889806635,1 +cb,f1,0.34267399267399273,,1 +copa,acc,0.66,0.04760952285695237,0 +hellaswag,acc,0.3934475204142601,0.004875162699121657,0 +hellaswag,acc_norm,0.4903405696076479,0.004988850185477487,0 +piqa,acc,0.6964091403699674,0.010728079893076364,0 +piqa,acc_norm,0.7023939064200218,0.01066735379238821,0 +rte,acc,0.5126353790613718,0.030086851767188564,0 +sciq,acc,0.741,0.01386041525752791,0 +sciq,acc_norm,0.712,0.01432694179723156,0 +storycloze_2016,acc,0.6520577231427044,0.011014779784784831,0 +winogrande,acc,0.5059194948697711,0.014051500838485807,0 diff --git a/4b284b1b9c4seed4/evaluation/rankeval/4b284b1b9c4seed4_3.json b/4b284b1b9c4seed4/evaluation/rankeval/4b284b1b9c4seed4_3.json new file mode 100644 index 0000000000000000000000000000000000000000..6980f92b12fefe101b29ed4ab5c669fddf9373c7 --- /dev/null +++ b/4b284b1b9c4seed4/evaluation/rankeval/4b284b1b9c4seed4_3.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.334, + "acc_stderr": 0.014922019523732961 + }, + "anli_r2": { + "acc": 0.36, + "acc_stderr": 0.015186527932040126 + }, + "anli_r3": { + "acc": 0.3475, + "acc_stderr": 0.013751753243291854 + }, + "cb": { + "acc": 0.39285714285714285, + "acc_stderr": 0.0658538889806635, + "f1": 0.34267399267399273 + }, + "copa": { + "acc": 0.66, + "acc_stderr": 0.04760952285695237 + }, + "hellaswag": { + "acc": 0.3934475204142601, + "acc_stderr": 0.004875162699121657, + "acc_norm": 0.4903405696076479, + "acc_norm_stderr": 0.004988850185477487 + }, + "rte": { + "acc": 0.5126353790613718, + "acc_stderr": 0.030086851767188564 + }, + "winogrande": { + "acc": 0.5059194948697711, + "acc_stderr": 0.014051500838485807 + }, + "storycloze_2016": { + "acc": 0.6520577231427044, + "acc_stderr": 0.011014779784784831 + }, + "boolq": { + "acc": 0.4529051987767584, + "acc_stderr": 0.008706176885837736 + }, + "arc_easy": { + "acc": 0.4877946127946128, + "acc_stderr": 0.010256726235129018, + "acc_norm": 0.46085858585858586, + "acc_norm_stderr": 0.010228298200766124 + }, + "arc_challenge": { + "acc": 0.23208191126279865, + "acc_stderr": 0.012336718284948854, + "acc_norm": 0.25597269624573377, + "acc_norm_stderr": 0.012753013241244514 + }, + "sciq": { + "acc": 0.741, + "acc_stderr": 0.01386041525752791, + "acc_norm": 0.712, + "acc_norm_stderr": 0.01432694179723156 + }, + "piqa": { + "acc": 0.6964091403699674, + "acc_stderr": 0.010728079893076364, + "acc_norm": 0.7023939064200218, + "acc_norm_stderr": 0.01066735379238821 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b1b9c4seed4/evaluation/rankeval/4b284b1b9c4seed4_4.csv b/4b284b1b9c4seed4/evaluation/rankeval/4b284b1b9c4seed4_4.csv new file mode 100644 index 0000000000000000000000000000000000000000..1ea47a98632df078743a19211505fd99f7df9fd4 --- /dev/null +++ b/4b284b1b9c4seed4/evaluation/rankeval/4b284b1b9c4seed4_4.csv @@ -0,0 +1,21 @@ +task,metric,value,err,version +anli_r1,acc,0.328,0.014853842487270334,0 +anli_r2,acc,0.352,0.015110404505648668,0 +anli_r3,acc,0.34,0.013680495725767789,0 +arc_challenge,acc,0.22696245733788395,0.01224049153613287,0 +arc_challenge,acc_norm,0.2525597269624573,0.012696728980207704,0 +arc_easy,acc,0.48063973063973064,0.01025208949116552,0 +arc_easy,acc_norm,0.46675084175084175,0.010237073872130747,0 +boolq,acc,0.43241590214067277,0.008664798701065797,1 +cb,acc,0.39285714285714285,0.0658538889806635,1 +cb,f1,0.23650793650793656,,1 +copa,acc,0.67,0.04725815626252609,0 +hellaswag,acc,0.3972316271659032,0.00488324657949666,0 +hellaswag,acc_norm,0.4969129655447122,0.004989686307484565,0 +piqa,acc,0.690424374319913,0.010786656752183345,0 +piqa,acc_norm,0.6958650707290533,0.010733493335721314,0 +rte,acc,0.51985559566787,0.030072723167317177,0 +sciq,acc,0.746,0.013772206565168544,0 +sciq,acc_norm,0.722,0.014174516461485256,0 +storycloze_2016,acc,0.6515232495991449,0.011018717784788488,0 +winogrande,acc,0.5059194948697711,0.014051500838485807,0 diff --git a/4b284b1b9c4seed4/evaluation/rankeval/4b284b1b9c4seed4_4.json b/4b284b1b9c4seed4/evaluation/rankeval/4b284b1b9c4seed4_4.json new file mode 100644 index 0000000000000000000000000000000000000000..d306fa9bd5c1652df4c2541c8fd8da97183d23f3 --- /dev/null +++ b/4b284b1b9c4seed4/evaluation/rankeval/4b284b1b9c4seed4_4.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.328, + "acc_stderr": 0.014853842487270334 + }, + "anli_r2": { + "acc": 0.352, + "acc_stderr": 0.015110404505648668 + }, + "anli_r3": { + "acc": 0.34, + "acc_stderr": 0.013680495725767789 + }, + "cb": { + "acc": 0.39285714285714285, + "acc_stderr": 0.0658538889806635, + "f1": 0.23650793650793656 + }, + "copa": { + "acc": 0.67, + "acc_stderr": 0.04725815626252609 + }, + "hellaswag": { + "acc": 0.3972316271659032, + "acc_stderr": 0.00488324657949666, + "acc_norm": 0.4969129655447122, + "acc_norm_stderr": 0.004989686307484565 + }, + "rte": { + "acc": 0.51985559566787, + "acc_stderr": 0.030072723167317177 + }, + "winogrande": { + "acc": 0.5059194948697711, + "acc_stderr": 0.014051500838485807 + }, + "storycloze_2016": { + "acc": 0.6515232495991449, + "acc_stderr": 0.011018717784788488 + }, + "boolq": { + "acc": 0.43241590214067277, + "acc_stderr": 0.008664798701065797 + }, + "arc_easy": { + "acc": 0.48063973063973064, + "acc_stderr": 0.01025208949116552, + "acc_norm": 0.46675084175084175, + "acc_norm_stderr": 0.010237073872130747 + }, + "arc_challenge": { + "acc": 0.22696245733788395, + "acc_stderr": 0.01224049153613287, + "acc_norm": 0.2525597269624573, + "acc_norm_stderr": 0.012696728980207704 + }, + "sciq": { + "acc": 0.746, + "acc_stderr": 0.013772206565168544, + "acc_norm": 0.722, + "acc_norm_stderr": 0.014174516461485256 + }, + "piqa": { + "acc": 0.690424374319913, + "acc_stderr": 0.010786656752183345, + "acc_norm": 0.6958650707290533, + "acc_norm_stderr": 0.010733493335721314 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b1b9c4seed4/evaluation/rankeval/4b284b1b9c4seed4_5.csv b/4b284b1b9c4seed4/evaluation/rankeval/4b284b1b9c4seed4_5.csv new file mode 100644 index 0000000000000000000000000000000000000000..c3ff05cff3b27beccdf61a30e0e3044a96df30c8 --- /dev/null +++ b/4b284b1b9c4seed4/evaluation/rankeval/4b284b1b9c4seed4_5.csv @@ -0,0 +1,21 @@ +task,metric,value,err,version +anli_r1,acc,0.329,0.014865395385928357,0 +anli_r2,acc,0.356,0.015149042659306623,0 +anli_r3,acc,0.3383333333333333,0.01366414400661828,0 +arc_challenge,acc,0.22696245733788395,0.012240491536132868,0 +arc_challenge,acc_norm,0.2551194539249147,0.012739038695202109,0 +arc_easy,acc,0.4802188552188552,0.010251751199542738,0 +arc_easy,acc_norm,0.4701178451178451,0.010241444322886432,0 +boolq,acc,0.4327217125382263,0.00866552668441624,1 +cb,acc,0.4642857142857143,0.0672477765493766,1 +cb,f1,0.2798941798941799,,1 +copa,acc,0.66,0.04760952285695237,0 +hellaswag,acc,0.39543915554670384,0.004879455474663814,0 +hellaswag,acc_norm,0.4986058554072894,0.004989762014739185,0 +piqa,acc,0.6942328618063112,0.010749627366141639,0 +piqa,acc_norm,0.7007616974972797,0.010684130673134581,0 +rte,acc,0.4981949458483754,0.030096267148976626,0 +sciq,acc,0.756,0.013588548437881431,0 +sciq,acc_norm,0.737,0.013929286594259717,0 +storycloze_2016,acc,0.6616782469267771,0.010941266252293478,0 +winogrande,acc,0.5035516969218626,0.014052131146915852,0 diff --git a/4b284b1b9c4seed4/evaluation/rankeval/4b284b1b9c4seed4_5.json b/4b284b1b9c4seed4/evaluation/rankeval/4b284b1b9c4seed4_5.json new file mode 100644 index 0000000000000000000000000000000000000000..a48b0aeb4af47e01db6c24a27fd725f065985afa --- /dev/null +++ b/4b284b1b9c4seed4/evaluation/rankeval/4b284b1b9c4seed4_5.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.329, + "acc_stderr": 0.014865395385928357 + }, + "anli_r2": { + "acc": 0.356, + "acc_stderr": 0.015149042659306623 + }, + "anli_r3": { + "acc": 0.3383333333333333, + "acc_stderr": 0.01366414400661828 + }, + "cb": { + "acc": 0.4642857142857143, + "acc_stderr": 0.0672477765493766, + "f1": 0.2798941798941799 + }, + "copa": { + "acc": 0.66, + "acc_stderr": 0.04760952285695237 + }, + "hellaswag": { + "acc": 0.39543915554670384, + "acc_stderr": 0.004879455474663814, + "acc_norm": 0.4986058554072894, + "acc_norm_stderr": 0.004989762014739185 + }, + "rte": { + "acc": 0.4981949458483754, + "acc_stderr": 0.030096267148976626 + }, + "winogrande": { + "acc": 0.5035516969218626, + "acc_stderr": 0.014052131146915852 + }, + "storycloze_2016": { + "acc": 0.6616782469267771, + "acc_stderr": 0.010941266252293478 + }, + "boolq": { + "acc": 0.4327217125382263, + "acc_stderr": 0.00866552668441624 + }, + "arc_easy": { + "acc": 0.4802188552188552, + "acc_stderr": 0.010251751199542738, + "acc_norm": 0.4701178451178451, + "acc_norm_stderr": 0.010241444322886432 + }, + "arc_challenge": { + "acc": 0.22696245733788395, + "acc_stderr": 0.012240491536132868, + "acc_norm": 0.2551194539249147, + "acc_norm_stderr": 0.012739038695202109 + }, + "sciq": { + "acc": 0.756, + "acc_stderr": 0.013588548437881431, + "acc_norm": 0.737, + "acc_norm_stderr": 0.013929286594259717 + }, + "piqa": { + "acc": 0.6942328618063112, + "acc_stderr": 0.010749627366141639, + "acc_norm": 0.7007616974972797, + "acc_norm_stderr": 0.010684130673134581 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2a4219a64b0935a2afa81700464d5fe44c51b30f --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:54e59b8fd3c85e027e8a8c6fb5f56e269eb308c0bebd4a9ad89ea7c0193597b2 +size 199058647 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_0_mp_rank_01_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_0_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a224ae55a9bdb2905ddb9ae8307fd564e27c531c --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_0_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3af1d957e635e97ac531f14e85e67de28bcbcf830d6c4f79357c6eedfda6b948 +size 199058647 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..45504ad0b1c82fdd73ebb995bee1d688cda30294 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:738a8953e172a31c9cb67cfb16cc287af590a316849c7732dc37f819449a899a +size 199058733 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_100_mp_rank_01_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_100_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1fd8170e44aaf9b05e2c7530d9e0a1f7c331663b --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_100_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f21623b03c1918cda1b28f2c1454a8584e95a0fc4c983491f48862069002cb6c +size 199058733 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..16bd6394a72af3736ef16643e28d07cec0b7ca83 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e0941fced7c62804c905aec71b512c116ad6d1328da5a08eb37b42da99d13fa +size 199058797 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_101_mp_rank_01_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_101_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d23b4a85bf2fa5ffb646acfd90cb75201a4b649f --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_101_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c60191af5aece249a57bd3a101521c616763b9712b85dadb69b1ba558969104a +size 199058797 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e02afff0dd508d3728e24f956bdedc6a3b7c0d45 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:26b645f5f3f9c656b0268a9604ac8bde0a578dc5588cee9b44752f1ae67970ce +size 199058733 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_102_mp_rank_01_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_102_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0b54209b30d16d0fca206d65715fdaeab394cce9 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_102_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d883be441c1a8bee08eb41565278ccc0daed912f5894f413b0047125c9b27046 +size 199058733 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cf1c1f6fcbdef08fe78ea7c0c6644a0773228280 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d3fe0522087a70eb9fa8fbe6827d039a36a4906cfc74eed3c2d343e8c5042dbb +size 199058733 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_103_mp_rank_01_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_103_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..112a2a17c474755af435319df8baac36274b015c --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_103_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:51035780f64f4d15137e2ce76bf11e5820fe7aad50f5f85a06e2fff716153802 +size 199058733 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4bc5c96b27c2a24d05d2161cf609cffda2d21245 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:951ae031ba3a05eed9c0e2544070dbd41167d0aae2ed774c9a21ccad6213a70c +size 199058797 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_104_mp_rank_01_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_104_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..421ef93e47ef7419391c2b31e42a372a5582a946 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_104_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:974b33fc548afe7a92c57004c70ce6e4c26846814ef96d238542909992a7c884 +size 199058797 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1f62704d8fe3469089af8431ea9ac66b9500cebc --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ddb13d68f2fc3afdef3f0fc0e821ee9ac52b014ec01ba0d4a159742d90b93535 +size 199058733 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_105_mp_rank_01_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_105_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..65a7b68d843cc129657bf86a2269627503f6d573 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_105_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae34ff28af3b9543fe029d8e732b41f748300c141bda162507f6519f4e5650fb +size 199058733 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a865fd12e69732f2f2113f113467a8a85d957b1f --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:489628231dff2aa9b3ddf31276db785dee1730080431b20b240716e3d0a39277 +size 199058669 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_106_mp_rank_01_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_106_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..80e4122599371112e012edcf331ed468ad77eb8d --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_106_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c1c474073753468ddb176dbb179b039c411b814352cffb4c3e67bc5a264b81aa +size 199058669 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..29b8a8dcc8ff82f92c80351965c6f447b97489d3 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da02690930c0e7f94c48c6393b4bfe00e9d149509ac4c7913382fdcce2f639b9 +size 199058797 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_107_mp_rank_01_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_107_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fcbccf8f0fcfcca73f3b2a2f667d39647df6ab75 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_107_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e12b498958cdbcbe865d107ba5c4471bd84cdc20c242c61b212236709b282012 +size 199058797 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0f40a38d6b91241098771d0498fac3a543cf6b29 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:02b2b9b0a922fe31d140f59ab8bb188fd8c74c72f0424744aa5974cf31df264b +size 199058733 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_108_mp_rank_01_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_108_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7b9808b92064c420c8d0e95ed4d35e56024a2365 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_108_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a29b77bb9561ada466910be3ccfbdd7d327d45656335b9c848307f7eb76710a9 +size 199058733 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d2453da1c64cab14d9a908b71cbdc6848dab289b --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1eaaa729b8869c4e8b6f30c21c9bbb2cd475861c3093e6af4846d0392a38d72a +size 199058733 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_109_mp_rank_01_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_109_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..35631b9696dd701c7e2a7f8e73fab50158355a7b --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_109_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:243c38416273764d57464e8f9540ccc8c074a3d190fdb07c781b38c8425f6620 +size 199058733 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..10c606c98d32914da8f6016ab16210797082350c --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:11337f9223201547b93fbd1146a5734c95438fb0e6b3bd017f7fd79f68423ccf +size 199058658 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_10_mp_rank_01_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_10_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..904f39ec133fcf26561bd5ebc35dc6811a7cb3be --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_10_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aa17a1d7d2af23c963765c1170af8377ca052d3202a0a29ca55c482b0825da84 +size 199058658 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0c2e2c7dc3a22f6b6094200db73b0d09fccadc97 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bccc23dd781424cfd22086a27699f0fb5b618796f9d20ba7f38eb10d02e3e941 +size 199058733 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_110_mp_rank_01_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_110_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..197bd03e81cc580c0af2b5e0ed2966ff006ba975 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_110_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:90720653e650556bf7bd7be7745f0ea25a5ae3fb31182b56b309b88cc1db3938 +size 199058733 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e9be1e23fad5bb8266ef0f44016401fc918299bf --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5ab2915d1757dea6f04fd64cad84c7c2003333384418094af503c6138566c224 +size 199058797 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_111_mp_rank_01_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_111_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e744934fa63db851c1067bd54b84446f2d236dbe --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_111_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a1ae97d7d038e2d3fb9e123ddd497c6fdd8f935b31527a530d77acd449b92b1d +size 199058797 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f3d39235436b68fa54d7053615a4b9b9bd35c22b --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2bea697ca2bdab25ee957f14c44cf3be31056f86c7c1419979130a10cc515e86 +size 199058605 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_112_mp_rank_01_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_112_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6122ec9c5b9843cb912be559c8e959cc571eadb9 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_112_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d487992b16cfc23d14eff1df8d10eb9f053c5ba0df20ba75ecefab853fedd140 +size 199058605 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..145513c4ddb87fcf14a0c5b61422f3dfb02ca011 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5d9d8a216b14505e67b0dce873f29140bac3dce24da15506c89eb1a2975a3512 +size 199058669 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_113_mp_rank_01_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_113_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cd01f18cc00e0fe7806130b7af36dd26d7f4d77a --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_113_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1a734bb6d2469c5a9caa385ead62f59bba0ab3449e41249fec0718053144085b +size 199058669 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..321d76bb015548d5e281fa53aad98f7de39b642f --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4c8ce2b57b9e853bc225b54dbc4b57509971fe86396b3789e784b9703fb00b47 +size 199058797 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_114_mp_rank_01_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_114_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d28e122bfccc8720b99adff75b90b79e716e80b6 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_114_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aa855bd6964aa6369175b3ddac94657eaf0f2710bc9de7b1a0d940a1aa3324b3 +size 199058797 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..58c4b132b31402f8ebb54539566d0039152c3801 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7e5a9f89d8c8ce91944b110df22f57ca342f4fb81ba39814fab6f5ba951a4ff1 +size 199058733 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_115_mp_rank_01_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_115_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..14b8001df645e26645b44c0f0a34c101340a7c1a --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_115_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e20af9e2d0229d14a7727aca49ff9f2304451d5d42c90d6cacb2437f4f8f28ee +size 199058733 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..062289828519768838c346a913eba0777e6c6087 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da030de9e43ecc1d5b4fc65bbfb84c0c786faa6df2b6a9b2d02c7671dca2e005 +size 199058733 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_116_mp_rank_01_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_116_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1e22e79202e4d88bfd7b75b11da321a97c9ee184 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_116_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae1e42471dde30edd17261918a360742586d7de986b95c94e73e2657770df0e1 +size 199058733 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3d07e1d7ec984219873359c5ea5da960d67e3107 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0553e4f8c29b4aab41b357a7478febcbcc53a7c1f342b09be6ee8b9b285c0971 +size 199058733 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_117_mp_rank_01_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_117_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..15b7c91d4ba807e309fbebd851fdaa654690ca6d --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_117_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eb87d9fe788f154eef96a762d986f3a8cd90cdc906ca6b72a2c97de3e3366f39 +size 199058733 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4b143f1fe60802601def5845f49eb158389c0fef --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:173de3b5d46f2a7cc1656c441ffd23f2732151ee41f80a128cb0956f247d4fdd +size 199058797 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_118_mp_rank_01_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_118_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c7e0f75562b83261617fed5b5dbbc60159466fa2 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_118_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3f571b3bcab480dea6b7e81819f0d1d62c4ee74183f2c5ae09493e46e4bcacb5 +size 199058797 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4632750d1ed720314f29e5813a0311b6954f3fe6 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d5dc24ed98e9c41eca76ba98067985dee02656e57bd6b27cdb0fc9290a70ba8f +size 199058669 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_119_mp_rank_01_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_119_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..568ca70a3c18a0d1ef41a47035f805b76dae6843 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_119_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d348eae70ff3b85f3f5b0dba7fb135b8eb333535af3c03bb61d1b8908c165894 +size 199058669 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..23dac482ff5356126720b0aa1b0f4ceb58c6a495 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a00290be4077c57b54897959774602f2cb4d30a41f06405183e655f207a1d7d5 +size 199058850 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_11_mp_rank_01_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_11_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a1a079a0f0bbc09811803563843de432d6feda4f --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_11_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0192c3868cced0a4164c99ff898a3a89b2ea2b5ecfa8fec2f5d7cded3b26a754 +size 199058850 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..65a72a43e8c214716c272098793c44f6868f57d0 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:65dcdb562b4aab9aa674e4217c831d7ef217abd4981a57606e8d09834003b86d +size 199058669 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_120_mp_rank_01_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_120_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4bdf5f26d5c7f1ff608f3557c018896375f0234d --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_120_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:54fc5c29e89b1cdd4d8890e1be27c297c14ca282ec86683bf8d8aed185d9fd88 +size 199058669 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..aca6562e99f66a80d21e7d388a7ead91ff7860b4 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7013348053a0e763811e3200eaeaa1141243656cb29257cdd2ca93104889ea9e +size 199058797 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_121_mp_rank_01_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_121_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6d41d7dd2f696a41b54008c04762136802fe02a4 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_121_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1fabcee32dcea577c9921981051403c89e7dd183322bd36a3fe6b83052e326ed +size 199058797 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0dd1be2f8a6cd9f22eb69732306127a3fb64cfa4 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf7edb60626947f2a2861a864787cdf129b44e1f0d8b74bc0845cdb370764cf0 +size 199058733 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_122_mp_rank_01_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_122_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..24637c56a21c376cf56e1f5cd34465bc8d203059 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_122_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:428a358e489864be1ed849c6ea2fe2d51567a53d1c81a4b679a3cf639bf81aa6 +size 199058733 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fb643c5c5f69faa332edd35e560acc62e158716a --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8cc13f05057428e04ccd8a2b9ea1eab30a75da9b765a88c187826605e18b9a5b +size 199058733 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_123_mp_rank_01_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_123_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6feb90ac72c827ab68cd2572f3f0d31fd35501b4 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_123_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:278d5c59529ca470895152d92e08bfc618af886f063ce12622ac58ce92b1e2ef +size 199058733 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1d2ffcd84d8179287bc4a7533180eb60a0f96280 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:13b65e9c8c4e5a77b208e36d257e5cf898ae9d6d5ad56767ea136ceb4d0c6407 +size 199058669 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_124_mp_rank_01_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_124_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2b7853b82acf765e682ffd4848dc9032f111ef9c --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_124_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:494f089771f1f7a83d518ed8ccd172c2216be3355422b858c828262b37da1cad +size 199058669 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..28a3ca970d4c482cbd789db6de4ad26715ad27f1 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5078addf610dc817e49e55dd0aebe92b0ecdf7cf1ce8f976212170f09e31639a +size 199058925 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_125_mp_rank_01_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_125_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3ea046b7273add1c463789ddbff590d409e69a7d --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_125_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5410263493491cba26693c0085866959c6d9af4e5eb6f158b2ce50c0fadfee57 +size 199058925 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2d4e057829fe2b64bfbcb060f2ae5b01c970d674 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3da76f0702f88ad4edb4321e4908335521685c9db0c0031ab8b0dd04ca2dc9a6 +size 199058605 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_126_mp_rank_01_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_126_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..941f31671a6ec30dbcf908c5407c26048206ddac --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_126_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:37008fc6175cb83acec9b687a4ffead82a069a877b49517eaaf57b8696489622 +size 199058605 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9266fadbcf657731b21f6dc7ee6f2e83a95913d7 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c4400b352c79cfa7375c36f496a2c00c28bf4acf18b07672857917c60b715a80 +size 199058605 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_127_mp_rank_01_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_127_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..159726a87b6a4e26bf6dd58295af72b6d9da6481 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_127_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:45b40c056214cd492d7a6688f00d6f49eb376f55f8c4321465e2c0fb9a4e2b12 +size 199058605 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ff9b9aa9ebfdaaa27c720c628ad6f3857205b4e5 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ddbbe312764428cb34438266b8894c1cf6b19db4e0059bf0f376d039d271df45 +size 199058722 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_12_mp_rank_01_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_12_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6a275b70e2d1cc30fe2f04dd45328a8f04eaf450 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_12_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cf621169628a202b65683ca40ce45b238bfee320039bf2c38bdeab853b0c707b +size 199058722 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e2608ff8e1a3efc7cfd7cc7a4e9db0b7280755de --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7efa476bd6d29f079591ed77faff9fc8a2d5a793450cc07654ed27f478296d42 +size 199058658 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_13_mp_rank_01_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_13_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8d8bb1fdc3768a3e1b4058adbea39fff988b84c5 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_13_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f3ebdae896fda7fb80be6baba047ef7a480700fb7e98ad72544a667437ca2623 +size 199058658 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..68dadce6364639eb7066b18d0c46220d75271017 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c37e58731b7d5db9a7a64cb435f3cef24a7b67a258561328e423a4735b45fe27 +size 199058722 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_14_mp_rank_01_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_14_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..62926a45fd7f4e9fdeff445c798c7299824b94e8 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_14_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d8ce5cae57fd3c099e0ed8cecf72b35d849b3bfaed1f55285f1f1f84be57c1d +size 199058722 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..54e54b9e2ca993cb55490c28a628c191ed117321 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3d04be391b3d2eea6e89d7a2f7604319341ae8bf39293fbdcec9b0456749e038 +size 199058658 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_15_mp_rank_01_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_15_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2011caee085c9b78af7c44f2fb3ebfad703e19ad --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_15_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:75b261a111a203264a017c2e6dea6cd72392fe59e022e0c03a0670d111d7425b +size 199058658 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2098e56386a381e8bd5b58615029c123c9254039 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c7ec968bdee29e812a128e67e898dff878253f9e874f958b05f96e9bb975b703 +size 199058786 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_16_mp_rank_01_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_16_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..216f4d6fdf0cc3f99713695f5dee937a634c04b7 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_16_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1f14ca20a35add06a0bcd7b57aba46bb5725d47d16f737a0383a523c86539ad7 +size 199058786 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..adcc7c1ee58c5145fded3d76ab26a6d21b82e707 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:81bbc02f5d99b4fa8520310493007633bb50d824de00d974c57fae711fa3a6fc +size 199058658 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_17_mp_rank_01_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_17_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9bd528ad067df68bb10ac27c118a4f606305c4b7 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_17_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:448c859e60eb1a3a46a94399ad8ce9d3bff2f72159654703b46131396d5361bd +size 199058658 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a5c85b42a4c62f9f008ee732af4ac4cbe2faff89 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2252fbd87602835f6f6feabb59afe8fadeed7a4b77428e18e0d5521f39c01516 +size 199058978 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_18_mp_rank_01_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_18_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ce53cf24eb91ff822e318892685f3ac351c6936f --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_18_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c125d8f7db94a8aa60041c610579bfadd073d43b48700b44522731f1ba23fcba +size 199058978 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1e3fb081880e6a3915b865ddbc0134d62799a102 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:93fe8917b0df38310b38178119f9b6cc07677deb5123e940dd59a5dacd13d61e +size 199058658 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_19_mp_rank_01_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_19_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3d01fc863b9c4a161040444028bbe444cd1f0fc3 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_19_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1351cd767b671bb9502cd409f20cef026089ab1ec5a92bb0dfc9cb0325acb134 +size 199058658 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8c9ae6e759c825a90171097041bcaa17f1f30194 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d72d35a82ca93c8d85a543379b95cde6d416b79a4b80a8f5de14d6207270de41 +size 199058647 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_1_mp_rank_01_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_1_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6dd52d3db868d1fd6a813758235f5b7e1c88a45b --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_1_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c8e8c4ee897f07f97c94c0b031549fcb56749997c6e59a93ece53f39de6a9b2 +size 199058647 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6bf9d2dc249abd43bd85222a0aa64b7dfb4d397a --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ff72b9e07cc10daaeb7d4d5b27d924e4df74fbe39916a349404b7714fc6b3caf +size 199058658 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_20_mp_rank_01_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_20_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..45109bc8605fa3e7c1bb1525bcbce25969301c8a --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_20_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:16e2bd0c632f12c4a10eec5a61a7cb5329ce0a71593628f07857fa9d007eaa7b +size 199058658 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3c1997354077fa41cb05c5b6b1cfdb3fa0742b1b --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f92866f110f88d69783fec79621c9c6fc891f06a6f5065fb24e78e52fb3b8283 +size 199058722 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_21_mp_rank_01_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_21_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6f428a38c5851e21d0515ed6279d0b794e827bc1 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_21_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:838026d368fdc0b02736dc1534f10efc9cb3638646645d254d0c547cdc826a44 +size 199058722 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d01be664ebaf9442458f79e58adb3d86a88b3727 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:747b2124fd008f18a0a2a89363aa2a093a374a65167138fdcbcb291cf91858f5 +size 199058658 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_22_mp_rank_01_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_22_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a32a087e317f4eb949401acc1254137f33ad68e9 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_22_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b31dde5ee48dd86e52ca65d6bff271a72a895dc3400422fc6f4f355cef620911 +size 199058658 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6c13be1562e6c0f7451d57a2d0ad1dd1b8d90619 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fe5380b71344b57feff4df275c6f1ec7f17c5f092a9789b0b572aba7c58ca425 +size 199058786 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_23_mp_rank_01_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_23_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9fb0921f4141c92b338ebe2ae18b05b8ae2bde94 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_23_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dbf66822656e8aeafb0c40d11c003895168c276639e16f6b2cde22a2f67ea468 +size 199058786 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..37dcc15e82f0759ba38e736a8d5ac2166879510c --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1b39cde58aa4e9f2c52875a32faaa540ffb734af18081791b73181bf042e6fb3 +size 199058722 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_24_mp_rank_01_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_24_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8885b493eb1f9e15a36ada300d24526db2e315e0 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_24_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:08a05d4766adb5b03b23c79ce4968563910fcc3ebf3d73acfc41ce2ad5dbc950 +size 199058722 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c540f793630f0baf3223de29e60a40ba96cdfa09 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:db4f1082554313d82913b5054549410f30130d26d39e0399d9f979dd9894a042 +size 199058850 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_25_mp_rank_01_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_25_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3a9be46ec300869bcf1083a126b0fb4387682b8a --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_25_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eb489162843124eb1a6d8bf4a363f3a8119956be2887d1f6dc1ed60aea3b300c +size 199058850 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..751b89c1e366b67b06291d9061f56637b80d0414 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a6bb55ef9d56e76f6091c601219b43c9064a5a95e34ec1b99ddf5bd55b73165 +size 199058722 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_26_mp_rank_01_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_26_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f473a41de7695cc0c077b43d9f3b6588a465220a --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_26_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:714c008702e24e2f2963e7ae15eb9ad919d701b0a11bfee93e554eabf89eac12 +size 199058722 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9bbf1f0d0b0aa64f80404e0e7ee8dcd95bcc3f94 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5448a5769306d04cbca730b6c6bd994b459bd734972b37b08a213babb33a7031 +size 199058722 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_27_mp_rank_01_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_27_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..736b232f68c410d1b1a30d96bc9e740653c2e784 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_27_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e9c96f897c1f3360cceff445ce18cdb195af4236966232fff6dfeb898f3dc672 +size 199058722 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..be99589bf6f089ad733be536123ff46a02255241 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:706bf71ebec13f14967aca7a2d09c1f8bfb080df593788410037516d14cea3e9 +size 199058594 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_28_mp_rank_01_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_28_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..daaf96ac679014a06fcb35494269e011f7d2f34e --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_28_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d83c83aede6d8ea788fd30d44d5b225d36e83858a8b26c378d361e1b643450e4 +size 199058594 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8c2354cb80ce466148bc352fa39ce6dbc8a60187 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1367011ec567b2e7f7dd63a4985e32019eeb83eca513d8516b62e292e311d9da +size 199058786 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_29_mp_rank_01_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_29_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..29c06c1f1b31d39f2d371fd699c1e4078aa3943e --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_29_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df12007ec6ad58c5a5ce699be5a604dfecffaff045ff35b2594ccbcd57149ffc +size 199058786 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f4826efd8cc53d51475a8d6153f6528daeffccf2 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba8ee13615f120b072a4f284e0385d245e5d64cb2bae28f1b0e47d0e68eea786 +size 199058711 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_2_mp_rank_01_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_2_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6bf89198b06f350135acddc97f1c6e3a35589648 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_2_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1c2b9eea9a53b0292f9693f1e654475ae81af3768d57d2f705cd16dd8bf1783d +size 199058711 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e23015741cdaac6905bccc7669147aad8e7c8823 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:817707e9f03a9259f6f4c28ea235c4eee7810df5a751e04251f28029d5abf76f +size 199058722 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_30_mp_rank_01_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_30_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..55be1571b705ed4b74e16d14f4a13a931a6c166c --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_30_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:607045868d52fb7e79ee32fc00adcfafbc3b83a0b2debaac727fa7ed7e059573 +size 199058722 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0f0021a6fc9037fd07a1f928b7abc2a317df2517 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:39dfb7ebc270433a06a8629bdfba453df44035c5e0d363399ac21ea1ab32b28b +size 199058722 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_31_mp_rank_01_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_31_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2402df3e2b8eec2f0d19d5888b6da93590d313ae --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_31_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:710c738a30170df6d46cc5176323a750c64d6fbc187226d2cc4a5d36692cb3b4 +size 199058722 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d32dc316d13d89bad45202630e52c4ee7a8002f3 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f2e8176613d73da121720fc8f3d5912fc1fa4a4a882b8cf36953cb50eecef931 +size 199058722 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_32_mp_rank_01_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_32_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fd3584bf265fb638d702599f98fdf602b9591445 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_32_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:78a64d063e555c03c6295ab574dc10fac99f788bd88d12b414d493db0825e8d3 +size 199058722 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cdfa5374aac04100ed338fc5ab83e03f0203d917 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:84821878374a9c297291bccf547adb6da424637ea3a08aa534685de470f20152 +size 199058722 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_33_mp_rank_01_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_33_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..78cf568c79b1757bf30bf868c101b3e5a2ef8c2f --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_33_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f2bbad83934f7c2ebe460edf15b42d8d75f85f69deb3e3f9a20ff7b520cb8aa9 +size 199058722 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..33e07ce9423981e47a8e34326823390fe3ad9228 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a8ec05abb2bcba247565a8c32d2640fb3ca897864f808e9c5d654b5bcb8aa3a6 +size 199058722 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_34_mp_rank_01_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_34_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a78faefef49dd9e1b03b0da27a372b6834a15822 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_34_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:949ae4725900378ea4074388a870342128b75862d94b356089907e316b49e6ce +size 199058722 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4e24895d99ee12cbde7eceeb6f99122805f06960 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7bb53124178ba211415094c66d182b0d51858067c803150d382ddcbc63b18002 +size 199058594 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_35_mp_rank_01_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_35_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9ea9fbaba544ac3d6bb0db6c2c51ca58bcc9a315 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_35_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d67dd20379719d0bbb4243a48d9e190e6f6e61b2afc6dae193a613ee782ce568 +size 199058594 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d1b6794262114a80428594130398ca132df0c098 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f84310406f22bc41ddaf57eb34f7db39000eaa716322059b96e8beda99c160d1 +size 199058722 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_36_mp_rank_01_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_36_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..084304577c8e4707390ce7ec1ff2ee5ef2386afd --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_36_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a72395867150e8658f27eaaa3f4658ee973a23c6b154b1df0b5fecaa729e40e +size 199058722 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0ef7b2ce1a0de74ec4965adebc2226859badf878 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:106ce0475620e24bdb338e6402fb900ed1dd574355697189950d8dacce98bfbf +size 199058786 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_37_mp_rank_01_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_37_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..41433a1476d4a316250bc557a7bc038a660b8933 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_37_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d30464618086b3bb9ebb00168f9fcaa58146510273388f5738a0b290368c1eb0 +size 199058786 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..79ae915be5aabc37aaa377bcb230f8b4718375e9 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dfba7fa8342ffa839e18ebdc73f1d7a372823b26d3e850b29ec9cae76514d409 +size 199058850 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_38_mp_rank_01_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_38_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f7f42a7d03399c6ff7fe447d647ee17a3199066b --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_38_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:36aeab17ff31639435932725aa9ced007d6d7b8f991910e9b13260e302ddc321 +size 199058850 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ea61752ba9e6b53d0a5815d67bae9cea24c2a084 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:834ca4c1dea2e7b4463c44b8ae2c244b93d36e6daaf69e69f3a13684e617eb4d +size 199058658 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_39_mp_rank_01_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_39_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4a573b120f9de2bd368a450a99c68f157d1bc611 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_39_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c6c6ae550ae6011fbcedf634aabb2503054ef7c270a191e9d1738bb94e94ac4e +size 199058658 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2cb4d5f0dec0f358aa5bc5f501ea94ccf5ab2989 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4958831c22f327f43683a4381023726af5bb78941b54f27d74da108ea9bfefe1 +size 199058647 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_3_mp_rank_01_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_3_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b10bb43008e4bef16911a03ac65fa4f03a0adf13 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_3_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:767278677e366578e1a2ce2ee6d702dd95a314a427966d03db8ae6cd897b4ff1 +size 199058647 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8e058e292573ee3658005f11257e8d6b645a5d81 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:25067a4a87a1342d68390e06983cada5662ff3ffbde25f4630a97aa05bbbc113 +size 199058722 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_40_mp_rank_01_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_40_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..97f60e3e57839a2ff9a8e97c71879e6aa8c7c55a --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_40_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fa908637f0cf3a76fa2c506e64b62390cfca3d31fd13db7e2ac657813476804a +size 199058722 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2590803b3a718842c5c74b8481b465f7270258f4 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c54bed70cbfdf79aa72ddcf8c2d58dcf7a0e6e74011d36ca1021260038155d9f +size 199058658 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_41_mp_rank_01_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_41_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..06826bd5218047728af840ba2487cfea7ac1e4e0 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_41_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b41b059c94ed0422d05fb40b1531936f51e74c61ff48129a9fd5d4e04fd764d3 +size 199058658 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..727e01161919b003613758266e3b20e5540c8369 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1c18ee5cae111eb789e630b6a776cb1070234dd2647fa7c14b4834187653cd7e +size 199058658 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_42_mp_rank_01_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_42_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..604c9676feb2ace53f42854251530fa9e20c5486 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_42_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3706f82c706fca19714d098476b59fecef11ab596a97a857598b8fab5fa8d795 +size 199058658 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cc71faaca4d55b2140b33fd0e9057ac3180a69c8 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b7b68bf71449d92035db4e537197a49d971257ac7e5a60115e0b8af165a7ad4 +size 199058722 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_43_mp_rank_01_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_43_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..eff531dd42424f75d680f856f560cffea40c0904 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_43_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bcc038b18de93dbd456c1b7fd882dff1232a99cac6dccc3285652367d720664e +size 199058722 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..59cf84a2a5a9a2cbfa3bb6aba30f516187700ecc --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c514f176c4d49f72ab2d8bf7f08359a6bef219d82fbcd5513e27bb192280114 +size 199058850 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_44_mp_rank_01_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_44_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..16bcc0f92c5785732f7ad6d2394e283f58298f71 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_44_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dbff479373cc4ec00deeb31b1a1faebd0229b7b4ea16954140c567c147b27955 +size 199058850 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..762adf2c279a47fffb44084c6b934db6aaf8936d --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b495a7fbea0b760115d3aac39dba697b81aad32fa210626f48e6f8b43a6656e4 +size 199058722 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_45_mp_rank_01_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_45_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2f0842ac1a24322040de003cbbd3e0e2678889fd --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_45_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4c78d5e7371ecbe9bef9634ef0270dd5329e2d22000818c101ddd8d4201a90b6 +size 199058722 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3e415ef67c24e870f013587db28dc7cca1f5fe87 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0aab30dbf5928c7a6e41645deb33848f0139c610297ea2aee7e083e544c83cc5 +size 199058658 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_46_mp_rank_01_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_46_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..643e946318c4bbad52f08e42fa7079b908812263 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_46_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3956efc3af7f13d3c1c255517c593fbae4cbf21d4e94b30a4597aff79c3b881 +size 199058658 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ce1925e383b1a75c587541d2f84677932797edf3 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6826e38796e562281d2a60fe383cd06f9e45039d07451fce142a4061e054f814 +size 199058722 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_47_mp_rank_01_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_47_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..21a7cef1a8ad486882b1c3697c7d9bfe1d9e6819 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_47_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5ea557774adfb34eb24c2d6e5034a321bbf1d54f1f44a41c5c9a3c77758bb922 +size 199058722 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6bd0be58e3f7c4422f981cc4e042309beb55e0c2 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:37faef6dffaccd0f64793d703b5f249bd2634878a4c000ac49614eaa2b3d088a +size 199058658 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_48_mp_rank_01_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_48_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..84ecf0c53caba045d9d91136792103a012ce0fe5 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_48_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:468238800d053406df3b164398ee5b524f503dae761bd1e207af9748d07ed4e7 +size 199058658 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..57b6a6a5ea566d5fd4e4c83232da4b91dca6ad14 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:efeb7ca93cca4241df233cd31972a081736e9c6fc730a8cbff5069210df90760 +size 199058658 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_49_mp_rank_01_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_49_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1d693873911700f65129f346cce2c4912c4609f4 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_49_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5c6a64cfbe0e04be5214abc13510b9e0651d0e37d5182c60ef04377a015b82b5 +size 199058658 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..907f757e66ea16932b230767c3cfff1f39c31335 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fbc410889c5088db53eb8d7f0af94a7942286a704d0dff624c37caf551e74750 +size 199058775 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_4_mp_rank_01_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_4_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bedba23d8a0c6ac7ab60ddf6b75eb72a55923f61 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_4_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4f69974158b0104ccbfcd0008ab7ae0a59f6b79c15ed0c8fb2b0c83ccb39436d +size 199058775 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cef353717276bced429b0e2df15bc2a8269db296 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f5778756079bf15d62601541819590d60ab16a27f825400e3011a8695c224f88 +size 199058722 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_50_mp_rank_01_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_50_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8545438fba9ed8ef9757b4267d4ac2a47468af95 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_50_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4bbe1ed4e23967edc74593be7221b80a5bfdb886b633f7ece9b53e4a04342481 +size 199058722 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0defcb0b991728a756cde7533330709aa3110c84 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9692b5f3a5da36f832e6c3222758387f0803826f117b0bbd196b515c49ca8aa8 +size 199058850 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_51_mp_rank_01_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_51_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ee327b5e121785b0e780ce3319da05e43fac6998 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_51_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:12513b125c19840f54b38c7bb1bba9805ff0e8accc0b77402fe7a4942b1cf94d +size 199058850 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6fdefc61c18270e1aec96654a41e9e9e5989bdb9 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a74e07e4eb0ff429de318ffb83cf65fedc13eb3f86bcf519721afa14dfb72701 +size 199058722 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_52_mp_rank_01_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_52_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..215040039ecc9b9909c213d2480d3930c6e4b211 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_52_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9f56da3e189fa3c358fc40201faab95ccccddc42d608f23982c7f7cf89da7db4 +size 199058722 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d511aa31b24b005dfaa1357dd786116f2b738f38 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7b34bb461e5fdb1a2f9aba5d16e75e59fb8b1b0374d5271a4994be314f63e1ac +size 199058722 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_53_mp_rank_01_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_53_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9036d8d2ab449986b673a1536986ca00a227a187 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_53_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b3bc51de1d960f03910988010d715df1f9427ad490d70d0a1a2cec63d7d9ee0 +size 199058722 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..50691e863c91efaa5525135593a3ee38e09f6b87 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:424241646129720a61bbe9fe8cb482cbf7e581203ff4563437d45cb396609098 +size 199058722 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_54_mp_rank_01_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_54_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e3c5368478a2e464c0f72435433a410b5f7c2fce --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_54_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5d0ea6e3cae9a56583b4f4f736197923b8adf9a95b92b1bf2c2d9b3de53e33f2 +size 199058722 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1a58cb3277586272bbb9c7b59ff990b5bbbd33a6 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:150d9b4821a1bfe22d25106ae4b3e1015362fda936b7c0a511e22aca06da5c9e +size 199058658 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_55_mp_rank_01_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_55_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e7aad1510d4788074fa89f3878bd7ae960892db0 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_55_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2e57de13feeb4303894a7e8f882fdafb1c8ee9f91037dc959368fddfc3da3de5 +size 199058658 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4bb60c9e4b8ad68b76e5a018c67a6d46041bc554 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d81515879b225b793d0b1be93f23a0f3adf0dd8e84eb2777aaecd259e099ee2e +size 199058722 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_56_mp_rank_01_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_56_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..97c3b1cdea09b6e3f6dd023e7a62ff4ca18cebfc --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_56_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2979ab1d369c75724a0f4d922b355b04c69fcacf6e5500147baf2008f45d1d6c +size 199058722 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7571917c2fd5bcf680f73ecc980990e9c36570ae --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:679d6ce340d424c92198408c0202c205f8a738dc8882b8554b896244623c62b3 +size 199058658 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_57_mp_rank_01_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_57_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7c51a0fb55a84d23096f6e8854424fa7b42d8a55 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_57_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1dde94b6f81a991f311d0776fd7c7e90802242ef492cd9f9169ea322aed086a4 +size 199058658 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..596cd8bd4a6be3c7bfd77e02b4bfff6457668220 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7b720c20dfd378adaf5feeaf188ed93e222d47b1bd9c3e6dd3cec1544660b575 +size 199058914 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_58_mp_rank_01_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_58_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..05dd04a252771d3fb785b690c4ee223eedf346e6 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_58_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:991ac05ee295df797e28e43b3600458587982d9fb529c4b70776635de3a5b390 +size 199058914 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..204e5116eec918eb0208a6c38bb96559aa76219d --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:91dbea3d67c20be49906b01c0f44a3aa7d085408f98884b44eed67ccf28525d2 +size 199058658 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_59_mp_rank_01_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_59_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e1ff75764fcf442d64d49a64f63074466c2dd595 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_59_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2f6f1460fb0f2850495f8459ae2ced5cbab301905f0e41efc2152354d1a98c07 +size 199058658 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..12125e5e6425c72d76a14afd9345ccaa6516f6e8 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2200bf1b8b870e88ac02d6f504942984dd9cb26059a83cfd0247aa4a577725f2 +size 199058711 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_5_mp_rank_01_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_5_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..009277edf5d708083885ff2cf29e99d9865980d7 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_5_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:86581a0fce95da03113b426691919988598dabd2300828468e2d8c43e5a093b4 +size 199058711 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4d8b2e726d902928f24ed1793d020ce7509d0c34 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2c8633b3d8f1469f1a4303c20f257eb68a30e2100c4810cb05c09dc904c6486f +size 199058722 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_60_mp_rank_01_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_60_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..839f6e2bcb7296f6f787233e9a8e9380994f469e --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_60_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f59a4bf8a2844788c23a035ef84aac560e88f67def8e6d0d97fcca2dd35575d5 +size 199058722 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f03ed0970bde143a26399c60e22fcac79b9b6787 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e47be07d6e4cc600ca2311da2ac87509d8437edef90eb5b376658688e70699f4 +size 199058722 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_61_mp_rank_01_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_61_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..69f966d823bd0046186f89992a655d5c05ed899c --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_61_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c11808378021c2fa25653eca1166ff325063b6ba95e6a4af50d30a4254935dbf +size 199058722 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1ddcdfc975745c61c395f604781fd379108a058d --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b9d68881fd97992e3f8dc3bea15e3c7009ec9a90d431d5972ac45f187bebbe5e +size 199058722 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_62_mp_rank_01_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_62_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..feecd9f19d8ac2b0df4748d6e53ff1a07541968f --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_62_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b5e6c232c61b927c9974d827659bba73a2c6d662664e0364af360efe75a579a3 +size 199058722 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0c7b39d2cc035d4d500f3ed86ed16a6af02c4321 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:14f4320c23c8383baeea975c90e63b88f34a559ad732560104d80bb0eed885f7 +size 199058658 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_63_mp_rank_01_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_63_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e4675acd7d99bbe29974dbffab791fde40197946 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_63_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:04b370d16cd087c8f341db7b60cb017ada904f4d045857af172b92fbc4fc6e82 +size 199058658 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c27a12768bc1d1e6e6ef1df77bc153928882951b --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b8c2750957f7d73da11381f377d6b98a566f68db310a931b3876904c31c22cd6 +size 199058658 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_64_mp_rank_01_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_64_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..364aa0f90f49ad639d43c0ce174176dbc0d24a04 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_64_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e1eb0ba25114a10bfa8f9bc7a1512eefa800f5afe1b9c37481cf1414442dfce6 +size 199058658 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..125d98d8301914da1a3296a4b4065ffcc9dae35e --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d17c5659edd87a91c45699b7582f33b6e53b231e57e3e05aa34fdfb380b42bc2 +size 199058850 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_65_mp_rank_01_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_65_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3b52dd50460971e56a8865f5398dcf60da366f01 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_65_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:322ae7e5687eefa29d1e1e6ec4d4890d8920d3a02cd9f3e06cf2aa474b65fa75 +size 199058850 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..64a4a482fc1dff4fcba6fe6dbdc4c8966d85e663 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5cad788b9e546db1248d0ade79fe1f1e0da9afa5a29cc667ff612b3d45ef77cb +size 199058722 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_66_mp_rank_01_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_66_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0457f574639645e12c3d020116203e9c4c397db9 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_66_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dcddbec980758849822e23330bcb2b4833a62aeac826ce9b050a5392e60a8dfe +size 199058722 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1d2fdaf922c7e7bb3eecc51d406b5f31365bd342 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:68dcd67a5c27e4073dafc77c04c5109bfe6fbd79a51f1284b0f0c7931a95a2d9 +size 199058786 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_67_mp_rank_01_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_67_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8e406954c9bad9dbbd21c299b00af48d933e5f11 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_67_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:50fb3506ab3a396c271a9eccb8c7fe3f570372551f6a9df0cd4ba6eed739838c +size 199058786 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..61a3dc545948afe0301f53249af11109e3032b37 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:71caa839e0155a2e577c294e47b1b098fc0d2d40da68c0212d9dcef6dbd3e0bf +size 199058658 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_68_mp_rank_01_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_68_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..55b369a5748c7f859af89eee6f83242cf9ebaa89 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_68_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b520ed45d5b2581dfa76d7bbb214c027e9b0d3b30fe99c3389031c3b1d151eef +size 199058658 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d381f8e9ff2da98259c00181b0ab7bf8ee88c983 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e79895ba99eb28c9e3d2b88e7841993cefc7d18778569643ac48ba693d0d1a56 +size 199058722 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_69_mp_rank_01_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_69_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7bc9ccd306224e61a26808195f0bd1a6bffe8867 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_69_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:21248c6f90b2dcebb59bd15cdb9630fc53ee44845047fa830006e31ede0c2353 +size 199058722 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a62f2e1c323437252675e326c7b9961dfd53cde2 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9a0fab8662f0af539e19a2baf41f9ad38229115ef304b317e6515d48cd35e204 +size 199058647 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_6_mp_rank_01_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_6_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ae12ed49414161d90ca219ad9d36ae31a32fa5c0 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_6_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9b98edced55feada8f8fb5ba5195c5f8aa2158e2e15b6b3f947660d428ef99e0 +size 199058647 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..75acb5312cab71193364b99b17b3c425bd6e101d --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d82a98b3d2b075297ce4314f3bcf398d98a04fe14bac1d18669b84b0c9bb28b0 +size 199058658 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_70_mp_rank_01_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_70_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e24472a7de691d4d0479166229cf7086093aa977 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_70_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7ace0cfca015d72bb1d50ff81ea388d4e77a292099193deb7d7f047fd34e7bb6 +size 199058658 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..85952505725135bfbb0d85fd15bbdd9867f69245 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cc829e487d8bddb2d39579d1c0dd55901211da957779308fc3fe15f2c24c4199 +size 199058722 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_71_mp_rank_01_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_71_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..43f47e30d4873f58dc35abed9bafde8d334cc5d4 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_71_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:baa15641aeb87be9020fa9e037daab2aef5671b5a5da61af4849843c9a48e6da +size 199058722 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8cb5616ab2c3c7d757349b38b80de5467951df8f --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8f0363d75fc7a1318751698d5b070256d829792c77941843118211388c54ffb4 +size 199058786 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_72_mp_rank_01_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_72_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cdad936b021ff66521037c526ee46472f76b5d62 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_72_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:711f0cb3ea45794ec34d13d3377eeee1eb3ed351d125b515587e096c64103043 +size 199058786 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ee8e32b526f6c65fe55ed71c0d0490f2a43cbd26 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:99aa014a5146e547b4b0e75d7facaf28c057ca2c8c8bd33e2095cee5bb3916ee +size 199058722 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_73_mp_rank_01_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_73_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c871996a341fc938ff1fb97af3e1c3047a3623ac --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_73_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d9978dc17254af6ee23aa053e865d00fc8ac3c7fdb0e70954ec1283282c76683 +size 199058722 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..65ba65db62b23f1b80235326082affa743a97db6 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:989d4b42db6e8507bcc09776a0fecec70ccf303e0c46d74c29e9868c3f0bc8cf +size 199058786 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_74_mp_rank_01_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_74_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7858713e9b7c51a4d48927b12cf190de8a53ec02 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_74_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1d159b9a430041d874c81c80d66738ac6b68f41bb6d2423e7203b83732f8c8e4 +size 199058786 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..85eb52401b32c3e02d017f3fb7bf95ddc96cb5c6 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2dc11e72c760fe2aba2db86c6b5c5d903457fd2b0681fde7ae6a9dbcccdd946d +size 199058658 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_75_mp_rank_01_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_75_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1f835c1a3ca2f96b0248f2da113a152f6c5f924f --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_75_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f8986b2e74711546726059b61eae03b54b8b3997dae00461aa4da9ea9eabf055 +size 199058658 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9559d96417ea22f0b1405d84d36570d7a0e1ed67 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e7cf7ada7a35640c58ebf3ed8975b8119449b22a08a7186e6f83b161ab808b35 +size 199058786 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_76_mp_rank_01_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_76_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..747550b66ce3853a2358ecbcd52a05b97ae2ffb0 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_76_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:34b3ac99bcb11d1c495e5daef44e43279f221eef191dd65042b1dfb0709df1a9 +size 199058786 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b32d30ed15eddea96cf214edf6698893b7b7225a --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b72e3e90c4562f012972b99177d23ebbe5220c64d2e0a369baafda4c3b8e0327 +size 199058658 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_77_mp_rank_01_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_77_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..356d6de0d1f64167e85e43026fb3c3ed7723bf53 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_77_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8409e463b72c1f2f077dd494c2bc5544a869ba2454ec920a429371f7c9c9f130 +size 199058658 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..44fb29a5321b5bc4ec30f1df817a4a09841a563a --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad0046813a9a818701b4321a1d3d06d0de9bf6244df9a48e3f8d63634e86ba43 +size 199058786 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_78_mp_rank_01_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_78_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ebf85d54fce6aee321014d20cce335cc0d997701 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_78_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c1b6b5379ec8e07f19200915b675da473b5c06e0fe04ebcdd95ecd5259ff40a5 +size 199058786 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2ca403dc48701c17fdd8275f7571a3f2cc358ec8 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76dc4ba7e2a93b02993c65350385c4f6d6bee1557d5d7fd061228d871280708f +size 199058786 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_79_mp_rank_01_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_79_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f91bcb32a796bdfe5388059254580904d10b0007 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_79_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5362c199bf546b7f163613413f69c85dd3b2e027086ca340d00462b523b0220c +size 199058786 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3ca5fe20636d905b06446d0faca831b7b6b3aced --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0f947f4f1da94903c3591ec653a1eca78c0fb6e03b3c7959c3f85cd5a9d3e8ec +size 199058647 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_7_mp_rank_01_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_7_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5deab7d8bdcb8f03350cdfc7736c38145b68372b --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_7_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bf2b881b8b37a6de7c76ec5038e340816494a9674ed997c5649996ecc72084e5 +size 199058647 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5497a40bf1632ad122259fe5850484ee793c0038 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:127ccb244ab3247aca811cd520fabeeed50e73421a07d00b0e1ba980a51ea72f +size 199058722 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_80_mp_rank_01_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_80_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..64c8ebeec7d10201fea414127f20068049932f2e --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_80_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4cb042aff49b7ee2c6d517c51d44bff63c8ffc2b202a4925a55f69e9cacfdd17 +size 199058722 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..af3b5cb5c6102b2d34e9ce4c0c4cd39cbee993cf --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7264f0efa379b78f6cd081f7fa16d8c0c6b26c36e8a3c11673150187d3517270 +size 199058722 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_81_mp_rank_01_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_81_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b2b44559b029bdfa42cc26aadce5b53024b8cd12 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_81_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9a1ede1299f9559ee9ee9f1f549996fb83166f0a7627bf8ab19305a2bc6839e2 +size 199058722 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..49d93559e209a8133f1804078499e28f65ec028c --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1f69ca9161242a791b1fa7c36521da6a161ccf7efc29a1d6ffd289fa108eefe6 +size 199058658 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_82_mp_rank_01_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_82_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9d8032b4cba3771b641c19f8b1bc01ad92401c24 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_82_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:33252c1a684f5206a50527ee44feef257c084d5a8614f91be66a9831754a7d5d +size 199058658 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2ffbe076b6ba6591329b8b318d37376c295aa2d1 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cfb7037cf16de2071fc09156ab78afa29edf680dbc49d79551a0e675d7ced6c6 +size 199058786 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_83_mp_rank_01_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_83_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1878794f1fc256fa6fc9dbb11870d4aa42d08160 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_83_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:78ff292b9289b6d31eb52cfcb983e0fb4b2d465d692874c8d2e1a5549e1059f5 +size 199058786 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7787871fe4f57bc7511cc3dceec6e9e4bc259a3f --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:af2d46bdc9aca30ae767cf5167ff7e4933a8f25af30202d72fc3fb90efc3c307 +size 199058658 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_84_mp_rank_01_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_84_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..617d7550446b81837140848dfa7b1ee41b363a00 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_84_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a469c09d74fbfc071b753c300e6df756eee02a6f25dddb0a058180fb30f7f69a +size 199058658 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..923f000a23195525c9e13a745c13eb855b3a597b --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f807a85e038e415d8992e064728d6261324136e3bf43e09eb5e475865c9283f0 +size 199058786 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_85_mp_rank_01_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_85_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6434402c5e7a82a474e1a9aa7600213791f57753 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_85_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8f2a9c3c0fe4505685c76b976070e8a38a7c61f5f7f040429c7f58401ac9cfb9 +size 199058786 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3078196bcfd4e9f9775fa6f1148c6b92febe6b86 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:25e5e4995e343cd59b296d956565eb4f0cf24694c8bf277a5ec78ddb2f1843af +size 199058786 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_86_mp_rank_01_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_86_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ad2c3be62aac25f7f94849eda425c20720e1571f --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_86_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2c17ff32795cd6e2cd8aaa1018989734fd0bf032bcf48d6548f20f69b3fbc723 +size 199058786 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a26707a9ca6aca1e83b9492e9f5e842421f88b3d --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f91cc6b03a9c82dfdc3ea8a15965c533920ef00c466bbb98b7a8ee544bbb2fd +size 199058722 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_87_mp_rank_01_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_87_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..02c9190d852455268ab01208c519cbd16dc8278d --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_87_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7436ae5e6d9a59b6aac6333616fe81f735829ade0a85c3abb641072b7099592a +size 199058722 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..04d520b026304c0b94309632d51b589d2cdf290d --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8d9a30af36bb03c26c57998ca4e0cc80e4930f66b6b91cabb6b3983e3c857433 +size 199058658 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_88_mp_rank_01_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_88_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fa91acd95594ecc9d045fb23b28037c56d2b305f --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_88_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:603a82ef4fb1032b8bdb7ef70998d6d65d7e89356193737f3e7dd8f3291e43ba +size 199058658 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1c42cdc3dc70d14410fd636002209d644da07fd4 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:829c8e3ef895da77f6e843f100e624f3c20205a740c18afc7eb70a05a6daf866 +size 199058658 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_89_mp_rank_01_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_89_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..31e23b031b9e680e7263a8040b22b4546a996c44 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_89_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d433578bc896736df1cd3bab2ac740fed1e1c4b9d1e65c7023918d2a1cb56086 +size 199058658 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..05bd404b29f6ef50295b831eeb2714f3b4bfa88c --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dfa2360eff26d09664a8c8775c812be7ea6248011d4e9a6fa044e50a8cd791bc +size 199058647 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_8_mp_rank_01_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_8_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ed199c21015b3c3bde11c8bb1e4f0ddb65a944bb --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_8_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4ba1c826c65ad744925461f987017d0529f93005e6ee7bb58d2422833069c25c +size 199058647 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2becaa13da79588003a7da30403452129473b1e9 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6cc79577371e220070a070300068c2cb78f1b8bf6a6c1a844a45bd3ded64d549 +size 199058850 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_90_mp_rank_01_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_90_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b142cedbce977a6876f339e42e3f30b03b3ebfb2 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_90_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:40f20b675847b9649ca8297b46080b5b17a17d8c569d51ed72c0d2d01d6f743c +size 199058850 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fc1a1d9f1f12a444d1534d70002928747cd5461d --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b23693503dc025e9d287721625ae7733ea391a1d7b2dae2615935ee9ab06c480 +size 199058722 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_91_mp_rank_01_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_91_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b5955d714a7d58dbca19a75bb5d88dd5585546a1 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_91_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:30a0d6179ad2ca7be8b4d783d62182741427be3a80366e1431df326498e8e709 +size 199058722 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a648b540b7807e30aeeccd0f68bf73a7c7d0053d --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b41d10457fd09ff0e765505b220cb4dc73a9d00e8391d67e567f33ba19222485 +size 199058658 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_92_mp_rank_01_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_92_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a34fadafa8585e362357d5f08b574009b39ddf38 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_92_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d177c9182d39d9f356f32f9269bd2e1792736041fd2f5f2c7d8dc1e7ca6af9b2 +size 199058658 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3c51a88fea929cfe2674ada9e3107315542fe28e --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3396e19e8490eb4a217766910a0041b314c45475b31db31583d406d4d5a2510d +size 199058786 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_93_mp_rank_01_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_93_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..01a9d5ed00b9c4b1be1291577c117864c7fc1016 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_93_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9579748405e0d52fba6ba4c62470030e9b8eeb5e24a1ae4f6d44437bc77a798b +size 199058786 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a424fac3cb430f296b48d0c818aeb77d7441fdc8 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2cb2b9cfeb37c0a7b5716af5524c9281936e44db6fd19d95aa18650928383e78 +size 199058722 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_94_mp_rank_01_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_94_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b61b55efdbc57b70ccc55b437329be910c266d9d --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_94_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4c1d433224887a837b20919c740469db81f8c5778f6f9822e457568736102e46 +size 199058722 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..83fc49992a26e445ebd99b96bfbfaaed0b1594bd --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:17739103106baef8f8d58cbe1c0f596f7945493f5e3d4a71854403ae8cd8fa57 +size 199058722 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_95_mp_rank_01_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_95_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2fc0ac86d46ea896432314187edea601878e9cfd --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_95_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0aa44a1cb5eb5506aa128bee35287874757b2f2e594e18c6334a5738e113991d +size 199058722 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..66fa98af243b0a14676e32419cec91332c0d0cac --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:836dbe8465e9ba35cbf3aa82fee19348ae03ece48db32ddadf6f94dc210dbb24 +size 199058722 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_96_mp_rank_01_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_96_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4972505210b9ada508c3ff66f1221905b9a2534a --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_96_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b9cfb45ff017a4f2e913059b03a7d6ce9ef809b8488e3a3cb336f4f3fc79633d +size 199058722 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fa6dc10cb9c998fab0012cb0c854f7dcf0e997a5 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3f247ec338452edceb081940cdbbb41a6457c58feaa9a361d92d8a4ff17ffa01 +size 199058786 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_97_mp_rank_01_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_97_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bfdb35bee2827cdc0186cfab8c417e7af20a2100 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_97_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:14533805d1a09fe4239aea776620d15f92ea3ef131240ba686cd4d322b6ad933 +size 199058786 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..937853815667c88ff17e9199cdcae4c873d8d7b2 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b69dcbfdc79ecb2f8db318c04efc6c013e772b5a98b067f8ba686842ce98a80c +size 199058658 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_98_mp_rank_01_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_98_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..77c18b89f2d1e017df05df7339e6768c63968e26 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_98_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e205cfa0f5852f9ea38aeb22cdc9743a468507c5374b802579de1f2a4a5de8d8 +size 199058658 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..873ba5c343a665cd3d9497835c8c5db6005326b3 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c13bd007957b9be1ffa3f592c979af42a5bed46afc8fb70c14169c8fa21822c +size 199058658 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_99_mp_rank_01_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_99_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7a91a7e3f8a7265edd480872f7f880c632619bff --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_99_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e16a8bd871fc135d0eb04abee5b56b8be5ed21bbaceb1499d15cae5edccc6bcc +size 199058658 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..823a68d965a89180714f195a37dc3a08cf979e50 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f2371febcbeadd89725bf5be73b105ce4a67018105aa2557bca7ad622ab7dc4 +size 199058839 diff --git a/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_9_mp_rank_01_optim_states.pt b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_9_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..071c038c9714a00db44cf224f542155bb0fb5622 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/bf16_zero_pp_rank_9_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:72ca9291df2ed483daf78c32465d647cb7c6994334cd7f6f203ca0a31378d996 +size 199058839 diff --git a/4b284b1b9c4seed4/global_step80108/layer_01-model_00-model_states.pt b/4b284b1b9c4seed4/global_step80108/layer_01-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..16a126e3061043935c90e6186d9d528652ec4bf9 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/layer_01-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:766644b0e111667af3eb723f219d073c4dcad6fc2af95bc14d1d9700d45b1c62 +size 167511299 diff --git a/4b284b1b9c4seed4/global_step80108/layer_01-model_01-model_states.pt b/4b284b1b9c4seed4/global_step80108/layer_01-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..eb3335ff7e16eec3588b20ff35d89d59dbf3a7f6 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/layer_01-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1bc19b8da1c9cf717915e561f73b7af020d2a42f18a0c1136e59206a7df5482e +size 167511299 diff --git a/4b284b1b9c4seed4/global_step80108/layer_03-model_00-model_states.pt b/4b284b1b9c4seed4/global_step80108/layer_03-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ad4af712cc1b51737df8aad124efe707d535b0a9 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/layer_03-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:30ea126b7e885177c6513eb01013addfd81cc3eed2298946a8ec00ab9ff1bcef +size 113308931 diff --git a/4b284b1b9c4seed4/global_step80108/layer_03-model_01-model_states.pt b/4b284b1b9c4seed4/global_step80108/layer_03-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..da19cba8f0ea4f0c03f7ed71aa34082ff41c79ce --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/layer_03-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4281e390068ff96d22ac5a50c9438dabde0d32aa840075624f03756341fa1a90 +size 113308931 diff --git a/4b284b1b9c4seed4/global_step80108/layer_04-model_00-model_states.pt b/4b284b1b9c4seed4/global_step80108/layer_04-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d78b9b7f9fa99763c6aa48cfb2f513a83a8b3915 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/layer_04-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:60f99f06d9855007ad71fab7fdf47a971927a6cba9d826be34362877bc035773 +size 113308931 diff --git a/4b284b1b9c4seed4/global_step80108/layer_04-model_01-model_states.pt b/4b284b1b9c4seed4/global_step80108/layer_04-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..62395758662fe3860828c7734b5f6f7cd6ff147e --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/layer_04-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76eaa21f375508cafa5990c6e21d027d73a6cc979615db569fc73f6f38e9e55a +size 113308931 diff --git a/4b284b1b9c4seed4/global_step80108/layer_05-model_00-model_states.pt b/4b284b1b9c4seed4/global_step80108/layer_05-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..24f5639523c5edb870603aadfe912e3e52e4a5e6 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/layer_05-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f12dba61c64a80294f0b807187ce63725b3584d7ee940f56b7ddf5f8f566e401 +size 113308931 diff --git a/4b284b1b9c4seed4/global_step80108/layer_05-model_01-model_states.pt b/4b284b1b9c4seed4/global_step80108/layer_05-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..16696e54726f9a78fa0259c7801462353dcf2624 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/layer_05-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:535d6222f6a074d55e0da0502df4b2b9828f61c23878cd93656509f3b4eaaa3f +size 113308931 diff --git a/4b284b1b9c4seed4/global_step80108/layer_06-model_00-model_states.pt b/4b284b1b9c4seed4/global_step80108/layer_06-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a9db4626bbf4e663269830c2bdaf3abaf15a3dfa --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/layer_06-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2cecc881ca8af86d62b89fc700fbe9f0aaac38741b364089424db621b2f9134c +size 113308931 diff --git a/4b284b1b9c4seed4/global_step80108/layer_06-model_01-model_states.pt b/4b284b1b9c4seed4/global_step80108/layer_06-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..084937ae8a1ba191536d1836987106c1262c8962 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/layer_06-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:754ee79681a5d71cfa19bf107f247e2919f9a71c0997d6529f56af34308ccb1a +size 113308931 diff --git a/4b284b1b9c4seed4/global_step80108/layer_07-model_00-model_states.pt b/4b284b1b9c4seed4/global_step80108/layer_07-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9fb586667a817aa44e77cf7f3c65c584274de9cb --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/layer_07-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:05781dc470b2ada04823d1846f06a25631967578b79135802f60cb04d354d052 +size 113308931 diff --git a/4b284b1b9c4seed4/global_step80108/layer_07-model_01-model_states.pt b/4b284b1b9c4seed4/global_step80108/layer_07-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4435bd9c190d2f7a4fae7ed00f9859019de11ff1 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/layer_07-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c74615e5f393f51640d5837234161aa637505c2d9944d07e7c603ca8522fd79e +size 113308931 diff --git a/4b284b1b9c4seed4/global_step80108/layer_08-model_00-model_states.pt b/4b284b1b9c4seed4/global_step80108/layer_08-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..56a9f8bdec6d72c878a6b61e44de6f4109959d00 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/layer_08-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fbee57f907a6c07b5427c92c216148fc9673ab88019633950948b530c9f0e0df +size 113308931 diff --git a/4b284b1b9c4seed4/global_step80108/layer_08-model_01-model_states.pt b/4b284b1b9c4seed4/global_step80108/layer_08-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..47042abc9111dfb7a0a19c31a6bacc13fdbfb5b4 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/layer_08-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:849d9a698daa7d375eed54904f47293e5b4dc9e7e25fdaf7e41d92dc1c52d825 +size 113308931 diff --git a/4b284b1b9c4seed4/global_step80108/layer_09-model_00-model_states.pt b/4b284b1b9c4seed4/global_step80108/layer_09-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7986c4bb7ff96b0997ea3fef3e8310b57e7ae930 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/layer_09-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cabbc65a8aa6188e8799ae4bae71969cc1d3de78ecf81e07c63fa50743a8c5ed +size 113308931 diff --git a/4b284b1b9c4seed4/global_step80108/layer_09-model_01-model_states.pt b/4b284b1b9c4seed4/global_step80108/layer_09-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a712b19c673c266857cf5c238d713db5233b72a7 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/layer_09-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:863ee1e1541b0d228bcf5448ac21a8252f190256dd605303ccbb66e094ab3959 +size 113308931 diff --git a/4b284b1b9c4seed4/global_step80108/layer_10-model_00-model_states.pt b/4b284b1b9c4seed4/global_step80108/layer_10-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..aa732e3e045bc717bd33daffa50a1001be9251bc --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/layer_10-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ed2888fcf7d3b7201b820bfb525f67b2f4f71df0bc84f55de469d4be0aef903f +size 113308931 diff --git a/4b284b1b9c4seed4/global_step80108/layer_10-model_01-model_states.pt b/4b284b1b9c4seed4/global_step80108/layer_10-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c1fedb735dae482c57a391a6c76781b80480d280 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/layer_10-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:58a09877f1be473408dbc94d2fedeb91d1520c0ae26db9d0eda1a1079adf6250 +size 113308931 diff --git a/4b284b1b9c4seed4/global_step80108/layer_11-model_00-model_states.pt b/4b284b1b9c4seed4/global_step80108/layer_11-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dffaeabd6ed0e283b78853e35d7dc9e169f583d6 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/layer_11-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bfade4a696856780655837a08fea145e273f0dd1ed4484b1fd1e3ed942aa537f +size 113308931 diff --git a/4b284b1b9c4seed4/global_step80108/layer_11-model_01-model_states.pt b/4b284b1b9c4seed4/global_step80108/layer_11-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6a1979a2b851b4b6d4a15b462919393041f81546 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/layer_11-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6d5f3b8c471b1be01efeae8485f3619fc1cda32d5855872c23f7ea0bb732fdfb +size 113308931 diff --git a/4b284b1b9c4seed4/global_step80108/layer_12-model_00-model_states.pt b/4b284b1b9c4seed4/global_step80108/layer_12-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1de21bf40567f11fda5aa67426d9118290e2a0a7 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/layer_12-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ce69df156b8b7dca1e6b4cec9f45def71d9960527757c1b28620e0d5bd6bbfd6 +size 113308931 diff --git a/4b284b1b9c4seed4/global_step80108/layer_12-model_01-model_states.pt b/4b284b1b9c4seed4/global_step80108/layer_12-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7d58278fbaf5b85b6d2f655724b07243551fdfc9 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/layer_12-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c38732180036ed3fcfd4d4f31589cbd74ec9b0388647f1d7dd81b304ca898c05 +size 113308931 diff --git a/4b284b1b9c4seed4/global_step80108/layer_13-model_00-model_states.pt b/4b284b1b9c4seed4/global_step80108/layer_13-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ebc87ddacfb608c7ea7376ac73f5f2d6b6f347ac --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/layer_13-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e0af504bb08898e2e9ee457e8b82a98895a0b4d4d79863507410c0732e2e88b7 +size 113308931 diff --git a/4b284b1b9c4seed4/global_step80108/layer_13-model_01-model_states.pt b/4b284b1b9c4seed4/global_step80108/layer_13-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..990cd30b706be0f7028962e9cc0fe8ac604b56fb --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/layer_13-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:85841b819116bb2e53b5e0fb7575fd6498558fe3323b8702ab7e43042ee29b6b +size 113308931 diff --git a/4b284b1b9c4seed4/global_step80108/layer_14-model_00-model_states.pt b/4b284b1b9c4seed4/global_step80108/layer_14-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e8e18bdbfb939424888cd49bdc86c3d40c5804bf --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/layer_14-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:77b06a9fdef2461edb574fd96e75123090cec759bd23e0f20ab4403d29941967 +size 113308931 diff --git a/4b284b1b9c4seed4/global_step80108/layer_14-model_01-model_states.pt b/4b284b1b9c4seed4/global_step80108/layer_14-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6d6ce1ba11809dadb6ec3c1af75428d879bcac58 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/layer_14-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:35ab623714378306957ef50dff742f25af6695e5bd7f9358fc8e934f7bbf5c9a +size 113308931 diff --git a/4b284b1b9c4seed4/global_step80108/layer_15-model_00-model_states.pt b/4b284b1b9c4seed4/global_step80108/layer_15-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7d4a206e370c927633d79f57dcd3e21b18f2016d --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/layer_15-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fb505f133399c6fb6cd1ba717bab5f4eb4a51b368096128d2551b4b9dfe98ad1 +size 113308931 diff --git a/4b284b1b9c4seed4/global_step80108/layer_15-model_01-model_states.pt b/4b284b1b9c4seed4/global_step80108/layer_15-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8364278677d64eab6bedb9588440b6fadf1ac9f9 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/layer_15-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2edcd24ce4753a9d3e5559ef800cfaaa0603168e61836194fbed3742e688eec7 +size 113308931 diff --git a/4b284b1b9c4seed4/global_step80108/layer_16-model_00-model_states.pt b/4b284b1b9c4seed4/global_step80108/layer_16-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..319b1bee6339971fc97ce78271e038d9abc60cc3 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/layer_16-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fcf6b2d32d441b7426ca2d920364dff7e0f943c4762ff3b913e21904d82da32e +size 113308931 diff --git a/4b284b1b9c4seed4/global_step80108/layer_16-model_01-model_states.pt b/4b284b1b9c4seed4/global_step80108/layer_16-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4ce04378264565be850b86108b40397a6b4ceeba --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/layer_16-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:31ebfa270a3d99db8788d5c54fe933ce392f25fad14977220c87a5d249b6c530 +size 113308931 diff --git a/4b284b1b9c4seed4/global_step80108/layer_17-model_00-model_states.pt b/4b284b1b9c4seed4/global_step80108/layer_17-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..23f24a3c7524e4daf2d5a8e2d8aa6cd90b05f0b2 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/layer_17-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b9084edd3d1a29caeb98256e41b09e4d2b72951388bd9e8e1d4e37d2a0d84cf0 +size 113308931 diff --git a/4b284b1b9c4seed4/global_step80108/layer_17-model_01-model_states.pt b/4b284b1b9c4seed4/global_step80108/layer_17-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..112ef1ca4417be25919b9f8c15c70f9f26699f47 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/layer_17-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c2c774a8066ee80646a857679f44584c04bf67a80b12549d6c38c0fede989933 +size 113308931 diff --git a/4b284b1b9c4seed4/global_step80108/layer_18-model_00-model_states.pt b/4b284b1b9c4seed4/global_step80108/layer_18-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d43e11c8e07dba4367574b8b695578528273bc1c --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/layer_18-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a75da6c4db15b79dc3da328d3106ac41e833c566b9bd830cbdeabc0787a58d18 +size 113308931 diff --git a/4b284b1b9c4seed4/global_step80108/layer_18-model_01-model_states.pt b/4b284b1b9c4seed4/global_step80108/layer_18-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c1d0062f686c4dfa5edbbe21a8c43fad50193715 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/layer_18-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:172eb6880fb2d2066ed972744c37d7dcc8e1d481b10bb7911c9cbf0a9fa3848d +size 113308931 diff --git a/4b284b1b9c4seed4/global_step80108/layer_19-model_00-model_states.pt b/4b284b1b9c4seed4/global_step80108/layer_19-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8bc8c605cbf797b2e741d6c8f9c3e7aed609cc21 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/layer_19-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7752ccf3b519316b20e61482f4a42016bd15aba174178b880a10cedfc853fd77 +size 113308931 diff --git a/4b284b1b9c4seed4/global_step80108/layer_19-model_01-model_states.pt b/4b284b1b9c4seed4/global_step80108/layer_19-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..258d85daac80c2155d313ace08ba1470e4ab4587 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/layer_19-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:37e0cf597dafd2e1eb69b4df318f778ff420ce888daad5ce9110ce95c03f46eb +size 113308931 diff --git a/4b284b1b9c4seed4/global_step80108/layer_20-model_00-model_states.pt b/4b284b1b9c4seed4/global_step80108/layer_20-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..505ca0b25c03564c16fc104530b3a442a3a518f1 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/layer_20-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0a64b6677756206603a56e58eae955e446e762378580b22f1965659e76f4a01a +size 113308931 diff --git a/4b284b1b9c4seed4/global_step80108/layer_20-model_01-model_states.pt b/4b284b1b9c4seed4/global_step80108/layer_20-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..768f22c366375cab788f94c8c50b867daee56472 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/layer_20-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c21cc09089c6c77df1e95d56adf1c33aa8c9f9bc8fa123c08001e1901acecc3 +size 113308931 diff --git a/4b284b1b9c4seed4/global_step80108/layer_21-model_00-model_states.pt b/4b284b1b9c4seed4/global_step80108/layer_21-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3f795a357248bf65be913cb4416e0281b31a2efd --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/layer_21-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c61d43cedd9058b351da5545f54ec4fbc49753fb8b4bf97e658ad9a24fac07c3 +size 113308931 diff --git a/4b284b1b9c4seed4/global_step80108/layer_21-model_01-model_states.pt b/4b284b1b9c4seed4/global_step80108/layer_21-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7187d3375c63130ab1839faf86599148be070ab8 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/layer_21-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bb38b6b5b22064bfe332e235b2ccc61953de89527551f0e60b21cd67dc4300e5 +size 113308931 diff --git a/4b284b1b9c4seed4/global_step80108/layer_22-model_00-model_states.pt b/4b284b1b9c4seed4/global_step80108/layer_22-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..860d5ab90fa73e29f15ae2bff284d4fa643e8044 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/layer_22-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1b05b6f1ed7d587dc1d7c494a948d704a2fb9ebb4f0bb4c1259a8516698c66c3 +size 113308931 diff --git a/4b284b1b9c4seed4/global_step80108/layer_22-model_01-model_states.pt b/4b284b1b9c4seed4/global_step80108/layer_22-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7415d87735c09655064ac7d32b3f1e9f2d04a72b --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/layer_22-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a8765b5954c2e08aa061db7742df26a2975451e830096d2a33de78db9ad1e2c2 +size 113308931 diff --git a/4b284b1b9c4seed4/global_step80108/layer_23-model_00-model_states.pt b/4b284b1b9c4seed4/global_step80108/layer_23-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed49fc1557cd44fc0c619a96c4a0a860dc2f58a --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/layer_23-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c2edec350baf4ab13c7a1af81aff644cd137f7705f9638a30018ac9b4c642911 +size 113308931 diff --git a/4b284b1b9c4seed4/global_step80108/layer_23-model_01-model_states.pt b/4b284b1b9c4seed4/global_step80108/layer_23-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6344c6fe8f41a4a62699290088b52b2afe8083ef --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/layer_23-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:71f0c08287773beb6c4afc03ba742891dc56c0dc5b5262bb8b436eaa8944fc95 +size 113308931 diff --git a/4b284b1b9c4seed4/global_step80108/layer_24-model_00-model_states.pt b/4b284b1b9c4seed4/global_step80108/layer_24-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..673bfaa065655aca6f0acc9d754dd2f91db6030c --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/layer_24-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f1189b6878b3b539f9368df79ec9f5190d9d39b039130e43e6b7a64f5b7dd26d +size 113308931 diff --git a/4b284b1b9c4seed4/global_step80108/layer_24-model_01-model_states.pt b/4b284b1b9c4seed4/global_step80108/layer_24-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a871269bbf18368d5e7998f360e4adec619b72f1 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/layer_24-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:afc40a14e7669890495f07d986a8b6f2d5533175207fa7acb2c31088bc478e83 +size 113308931 diff --git a/4b284b1b9c4seed4/global_step80108/layer_25-model_00-model_states.pt b/4b284b1b9c4seed4/global_step80108/layer_25-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3792cd8fa31f8696b553c58f4328de33011c746f --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/layer_25-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e2c08341aedc8010099945d809a82c4b63271d544422ede6c157cd15160a2ef0 +size 113308931 diff --git a/4b284b1b9c4seed4/global_step80108/layer_25-model_01-model_states.pt b/4b284b1b9c4seed4/global_step80108/layer_25-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..722075ec48d3f6802906217aa8636152d0c42fb5 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/layer_25-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:780314331725b5f234fdf11b80cc67fcbc23ff0cfd4040de472c022415ffc84d +size 113308931 diff --git a/4b284b1b9c4seed4/global_step80108/layer_26-model_00-model_states.pt b/4b284b1b9c4seed4/global_step80108/layer_26-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..48090b2599bbc6fb550f5209a2e33b8ab1226b39 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/layer_26-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3f00790ca0b0a61f099581331d02ce25f807a070f76a7b03bc41cb8e363a943a +size 113308931 diff --git a/4b284b1b9c4seed4/global_step80108/layer_26-model_01-model_states.pt b/4b284b1b9c4seed4/global_step80108/layer_26-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ad72b4d366c10dca19a1292a46b5ef02b3143677 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/layer_26-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9a3803605d81e2e2beb0657a1e0fc929f8c26f50a25246f89c30c13d275312e1 +size 113308931 diff --git a/4b284b1b9c4seed4/global_step80108/layer_27-model_00-model_states.pt b/4b284b1b9c4seed4/global_step80108/layer_27-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b7793f2a99671a64e30aaa3169dd25286b38ad61 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/layer_27-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:728afc4529173252f418dc3163edccf6e787c7142253968f43322c55597a03f8 +size 113308931 diff --git a/4b284b1b9c4seed4/global_step80108/layer_27-model_01-model_states.pt b/4b284b1b9c4seed4/global_step80108/layer_27-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..79a1389a7fbb825a4e3d77f53dc030c0fb3ed0eb --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/layer_27-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:88ef4d3e2e8a35588ea08608d738e1ed1f3abb2fa3507c08964ce62858db8fd7 +size 113308931 diff --git a/4b284b1b9c4seed4/global_step80108/layer_28-model_00-model_states.pt b/4b284b1b9c4seed4/global_step80108/layer_28-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a318854573485ea0a6c28ad46505f29f415009b5 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/layer_28-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:02960365bae8a8440357e9e0c765c05581e3b2e616a9a369c47da29f1d764774 +size 113308931 diff --git a/4b284b1b9c4seed4/global_step80108/layer_28-model_01-model_states.pt b/4b284b1b9c4seed4/global_step80108/layer_28-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..47170e9fe1296d3508876c120b69115718a5930e --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/layer_28-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b06be77ed9ca6ffe3f7eefce57abb35eaa784746890d030f9ced5eb160868dc3 +size 113308931 diff --git a/4b284b1b9c4seed4/global_step80108/layer_29-model_00-model_states.pt b/4b284b1b9c4seed4/global_step80108/layer_29-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7c542de7cd21631f2a871cfddf4b7f72fd1fa026 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/layer_29-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:53a1162fe557f6e2c0d7bde34bc524c32040bfd52cae8d2e33233cf87801942c +size 113308931 diff --git a/4b284b1b9c4seed4/global_step80108/layer_29-model_01-model_states.pt b/4b284b1b9c4seed4/global_step80108/layer_29-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1918cbd6249bfc1cf99a4a4388812007666cc5e4 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/layer_29-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b24f5652cec26ca27c875e0098e023388eaaaaa82827110319f4add715ae3710 +size 113308931 diff --git a/4b284b1b9c4seed4/global_step80108/layer_30-model_00-model_states.pt b/4b284b1b9c4seed4/global_step80108/layer_30-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5ad9eec7bb42d36484293fd4bc19cc69b18a93ec --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/layer_30-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d8c28ad98010d4c3bb9dfd158901595f4497dd5bee3a26cbe4846b59f2c14752 +size 113308931 diff --git a/4b284b1b9c4seed4/global_step80108/layer_30-model_01-model_states.pt b/4b284b1b9c4seed4/global_step80108/layer_30-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..259dadbd380b267acc4d52fc56d8bf4fabd79a64 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/layer_30-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9efd56cb897ed63ea78bc7ab69422d3e5e4439c2ae17057b238cd402e8519c85 +size 113308931 diff --git a/4b284b1b9c4seed4/global_step80108/layer_31-model_00-model_states.pt b/4b284b1b9c4seed4/global_step80108/layer_31-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d2975b17216a4838edecaef90f789e55d06281c2 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/layer_31-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e312b074cc8305e96bafcaa0811f7c84219ed4d2ccf9ad39bf4dd59e43ae7df +size 113308931 diff --git a/4b284b1b9c4seed4/global_step80108/layer_31-model_01-model_states.pt b/4b284b1b9c4seed4/global_step80108/layer_31-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b7137bd16d1a8293f73cbd1de20b4fb6a39dde1c --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/layer_31-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bc2265f51627822425a64b1037935f739523da42390f3293b7b5b1ee6e213324 +size 113308931 diff --git a/4b284b1b9c4seed4/global_step80108/layer_32-model_00-model_states.pt b/4b284b1b9c4seed4/global_step80108/layer_32-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a4fc7914da383b6f63f2e9c9b63613cbe89539ff --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/layer_32-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2d4b56dce4923503076b1e32b010129a7148a365623fa4b5f720084be0ffa977 +size 113308931 diff --git a/4b284b1b9c4seed4/global_step80108/layer_32-model_01-model_states.pt b/4b284b1b9c4seed4/global_step80108/layer_32-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3e3b60715ca8c13ed7be72aa6be975affcd9db60 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/layer_32-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:551c6d462f093a97460e90855e7b99e76d8f0f84f9a3ea0294cc534487dfa341 +size 113308931 diff --git a/4b284b1b9c4seed4/global_step80108/layer_33-model_00-model_states.pt b/4b284b1b9c4seed4/global_step80108/layer_33-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cc24cddd33a27a6030930c385823cb4bf5280657 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/layer_33-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:669ab831eaaa9cd1a7929390fad7c87c0247a73ee4e45dc43de0fb1e82da63c7 +size 113308931 diff --git a/4b284b1b9c4seed4/global_step80108/layer_33-model_01-model_states.pt b/4b284b1b9c4seed4/global_step80108/layer_33-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6a5ee9ce080ef43ef95ca2a2f1dd6f0a230938e9 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/layer_33-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9a49559dd212417fcb83bd8fb69c5395986e592873d7b7f0ebd4b92b110cff15 +size 113308931 diff --git a/4b284b1b9c4seed4/global_step80108/layer_34-model_00-model_states.pt b/4b284b1b9c4seed4/global_step80108/layer_34-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8d58f62b0f0b4dc529bef8e292dfe2b47b0d8a54 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/layer_34-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c56856e088091e6643aea3fae7f164d94a4ae3337cd144d42b96269b36c09a34 +size 113308931 diff --git a/4b284b1b9c4seed4/global_step80108/layer_34-model_01-model_states.pt b/4b284b1b9c4seed4/global_step80108/layer_34-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0e6f3c07fe1753d21e69def215779ddde06ae564 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/layer_34-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a3104ed7574964f334d1a09954135db1944189b554767d0178732699876bb8da +size 113308931 diff --git a/4b284b1b9c4seed4/global_step80108/layer_35-model_00-model_states.pt b/4b284b1b9c4seed4/global_step80108/layer_35-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d1fb4f046cd92241dbf1f7900386329db9b2686f --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/layer_35-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ccfe6060ac51e2d04020752ded80c117e1af755e8af0298b324ae7e88fa330b2 +size 113308931 diff --git a/4b284b1b9c4seed4/global_step80108/layer_35-model_01-model_states.pt b/4b284b1b9c4seed4/global_step80108/layer_35-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fc8ccdb3b993873948466bc878c13e39173b50a7 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/layer_35-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:74225d977bd52dae5fc1be9d5c4275fa4239cf5bbaf2d0fe8ac231390bd758df +size 113308931 diff --git a/4b284b1b9c4seed4/global_step80108/layer_36-model_00-model_states.pt b/4b284b1b9c4seed4/global_step80108/layer_36-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cc8b9292c0156983aaa779eb8af3eadef92c7d2e --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/layer_36-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:42bf2e0fd9359d9f9130766f30c98e75d76b4251a13af4c84a8c1f156eaff7d5 +size 113308931 diff --git a/4b284b1b9c4seed4/global_step80108/layer_36-model_01-model_states.pt b/4b284b1b9c4seed4/global_step80108/layer_36-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c8db3591f4513e4a40e2c59b969e1a0af2e70339 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/layer_36-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:58b9d2201ba621e617f21a44fba90379dd0d9956d69ed0a84fa32afe2c6faaa8 +size 113308931 diff --git a/4b284b1b9c4seed4/global_step80108/layer_37-model_00-model_states.pt b/4b284b1b9c4seed4/global_step80108/layer_37-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..29b107160700bd638535ac2ccc7db45b9e84099c --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/layer_37-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:75f940e5cc415f62cb5f71647b5df696cb04d2355e371d5efc460076494f6453 +size 113308931 diff --git a/4b284b1b9c4seed4/global_step80108/layer_37-model_01-model_states.pt b/4b284b1b9c4seed4/global_step80108/layer_37-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bfdb657fa9bf086e1620b140a9fa8505b497ba2b --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/layer_37-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2e0d8ea4a8497a8bd383d207b1ced472d472c7ea5f348d8a26529f0bd47fa08a +size 113308931 diff --git a/4b284b1b9c4seed4/global_step80108/layer_38-model_00-model_states.pt b/4b284b1b9c4seed4/global_step80108/layer_38-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..73644e3a7cf895eada5b75e2d11266b11702862a --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/layer_38-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fe41bcd50ea6bc17ae31adb676e44c5a1f831d79bdcfde2db5f77a82fd542229 +size 113308931 diff --git a/4b284b1b9c4seed4/global_step80108/layer_38-model_01-model_states.pt b/4b284b1b9c4seed4/global_step80108/layer_38-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bd636e7576c89eb44dbf445dfc8351fbe3c43a5f --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/layer_38-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b2a0c3a3b81a76233b3560bea2a122c48732b39e2b2f3e0793de0cbfe72c18fb +size 113308931 diff --git a/4b284b1b9c4seed4/global_step80108/layer_40-model_00-model_states.pt b/4b284b1b9c4seed4/global_step80108/layer_40-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b0d341ea6a7a153b3359ebda370a53a26e2b59d5 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/layer_40-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:37abb8d44971c9ea7001f60922954ff3ab3788478d2ef167561a0d4cbb3a21e2 +size 13507 diff --git a/4b284b1b9c4seed4/global_step80108/layer_40-model_01-model_states.pt b/4b284b1b9c4seed4/global_step80108/layer_40-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c8250a8f84b17b0e1d0c818b8efc52a9c418f9d0 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/layer_40-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:651ec9a510abc0f5f0f5d582ebc403b78dacfa02e1575ca5e822c241bc22894a +size 13507 diff --git a/4b284b1b9c4seed4/global_step80108/mp_rank_00_model_states.pt b/4b284b1b9c4seed4/global_step80108/mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7548f1b3637846caf72fdc56e3a82a48920cc4bc --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:06bdd84230dd0bbb0fa4c9ec7f021e1cfc4b95ae628eba2695df5dfaf643b753 +size 51443 diff --git a/4b284b1b9c4seed4/global_step80108/mp_rank_01_model_states.pt b/4b284b1b9c4seed4/global_step80108/mp_rank_01_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a0fd7734b55019cdfbff1f515dd289635135d0b6 --- /dev/null +++ b/4b284b1b9c4seed4/global_step80108/mp_rank_01_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f10881cb0e1f818d69a72bbc3e024e5751dcd61f22a05e10527aa58e1edc0391 +size 51443 diff --git a/4b284b1b9c4seed4/transformers/config.json b/4b284b1b9c4seed4/transformers/config.json new file mode 100644 index 0000000000000000000000000000000000000000..df814c3a71ee49044410636b5eeb4f43611690ba --- /dev/null +++ b/4b284b1b9c4seed4/transformers/config.json @@ -0,0 +1 @@ +{"vocab_size": 50432, "n_positions": 2048, "n_embd": 3072, "n_layer": 36, "n_head": 24, "n_inner": 12288, "activation_function": "gelu", "resid_pdrop": 0.1, "embd_pdrop": 0.1, "attn_pdrop": 0.1, "layer_norm_epsilon": 1e-05, "initializer_range": 0.02, "summary_type": "cls_index", "summary_use_proj": true, "summary_activation": null, "summary_first_dropout": 0.1, "summary_proj_to_labels": true, "scale_attn_weights": true, "use_cache": true, "scale_attn_by_inverse_layer_idx": false, "reorder_and_upcast_attn": false, "bos_token_id": 50256, "eos_token_id": 50256, "return_dict": true, "output_hidden_states": false, "output_attentions": false, "torchscript": false, "torch_dtype": null, "use_bfloat16": false, "tf_legacy_loss": false, "pruned_heads": {}, "tie_word_embeddings": true, "is_encoder_decoder": false, "is_decoder": false, "cross_attention_hidden_size": null, "add_cross_attention": false, "tie_encoder_decoder": false, "max_length": 20, "min_length": 0, "do_sample": false, "early_stopping": false, "num_beams": 1, "num_beam_groups": 1, "diversity_penalty": 0.0, "temperature": 1.0, "top_k": 50, "top_p": 1.0, "typical_p": 1.0, "repetition_penalty": 1.0, "length_penalty": 1.0, "no_repeat_ngram_size": 0, "encoder_no_repeat_ngram_size": 0, "bad_words_ids": null, "num_return_sequences": 1, "chunk_size_feed_forward": 0, "output_scores": false, "return_dict_in_generate": false, "forced_bos_token_id": null, "forced_eos_token_id": null, "remove_invalid_values": false, "exponential_decay_length_penalty": null, "suppress_tokens": null, "begin_suppress_tokens": null, "architectures": ["GPT2LMHeadModel"], "finetuning_task": null, "id2label": {"0": "LABEL_0", "1": "LABEL_1"}, "label2id": {"LABEL_0": 0, "LABEL_1": 1}, "tokenizer_class": null, "prefix": null, "pad_token_id": null, "sep_token_id": null, "decoder_start_token_id": null, "task_specific_params": null, "problem_type": null, "_name_or_path": "", "transformers_version": "4.25.0.dev0", "n_ctx": 1024, "gradient_checkpointing": false, "model_type": "gpt2"} \ No newline at end of file diff --git a/4b284b1b9c4seed4/transformers/pytorch_model.bin b/4b284b1b9c4seed4/transformers/pytorch_model.bin new file mode 100644 index 0000000000000000000000000000000000000000..44c9905c9d500d3b901022598e81d4f0cee8c5f1 --- /dev/null +++ b/4b284b1b9c4seed4/transformers/pytorch_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0fd94d9cd7c46f7c9db61aeab78ddbe2d7ef670640f5bf982a6fa92d5a61fe53 +size 8781203669 diff --git a/4b284b6bc4seed1/evaluation/generation/agg.4b284b6bc4seed1_GEM-web_nlg_en_PALM_prompt_0.json b/4b284b6bc4seed1/evaluation/generation/agg.4b284b6bc4seed1_GEM-web_nlg_en_PALM_prompt_0.json new file mode 100644 index 0000000000000000000000000000000000000000..012d1d60d1084b478a31eec1bbed1bea1f195408 --- /dev/null +++ b/4b284b6bc4seed1/evaluation/generation/agg.4b284b6bc4seed1_GEM-web_nlg_en_PALM_prompt_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.34350884519310554, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.038772150149038065}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.07173003966213615, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.001891427473975356}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.28960101855358183, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004686243089174828}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.10544276754647447, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0021544893348497355}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.03426167301990358, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0012315349939346193}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.1392743239236764, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0032402937101130005}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.05038765662771961, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0013708215929186423}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.06788583144299273, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0017322495246173835}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.2789368995485402, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004534363609043255}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.10030410348988913, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.001982177743894177}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.06804073106746164, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0017862439598119247}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.2748870394126657, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004363263583019278}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.10000096230678256, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0020180656843696763}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b6bc4seed1/evaluation/generation/agg.4b284b6bc4seed1_GEM-web_nlg_en_PALM_prompt_1.json b/4b284b6bc4seed1/evaluation/generation/agg.4b284b6bc4seed1_GEM-web_nlg_en_PALM_prompt_1.json new file mode 100644 index 0000000000000000000000000000000000000000..cc4debf36c192f4a703321ff25adc99ddaee7d7d --- /dev/null +++ b/4b284b6bc4seed1/evaluation/generation/agg.4b284b6bc4seed1_GEM-web_nlg_en_PALM_prompt_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.4045455604224073, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.0236576374456469}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.0658970899010487, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0014479646288584037}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.3525261563529861, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0050415399648793355}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.10223984226049061, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.00175780338655891}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.029637673551245882, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0009108165706734375}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.1656326153435222, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0035022509689606276}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.04600863612485982, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0011042614632539437}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.06067096918490614, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0013097575690947149}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.32060026791609386, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.00440422446137861}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.09408291635077375, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0015927729242144477}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.06224519569533051, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0013718123071500563}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.33007977466199706, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.00463723121449382}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.09636959670083528, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.001661162141611167}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b6bc4seed1/evaluation/generation/agg.4b284b6bc4seed1_GEM-web_nlg_en_PALM_prompt_2.json b/4b284b6bc4seed1/evaluation/generation/agg.4b284b6bc4seed1_GEM-web_nlg_en_PALM_prompt_2.json new file mode 100644 index 0000000000000000000000000000000000000000..4dbaa703fd466ebec132e93778cc860e54bb922b --- /dev/null +++ b/4b284b6bc4seed1/evaluation/generation/agg.4b284b6bc4seed1_GEM-web_nlg_en_PALM_prompt_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.4841613222907723, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.015039273978834939}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.06966385259464293, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0013937412637180038}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.37512398125219343, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.005116912749333124}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.10929288546298149, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0017988667388595812}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.03198301338818694, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0008718774993262271}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.18094325736423483, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0036323707654308335}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.050112452100538586, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0011570842093378976}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.06360059097903424, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0012449705718618718}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.3388899116424299, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004438023718580559}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.09977161025587211, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0016243784066598424}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.0655984906937379, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0013223896668450679}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.35115785035117936, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004705333926430955}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.10273089804493778, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0016928851028229573}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b6bc4seed1/evaluation/generation/agg.4b284b6bc4seed1_GEM-web_nlg_en_PALM_prompt_3.json b/4b284b6bc4seed1/evaluation/generation/agg.4b284b6bc4seed1_GEM-web_nlg_en_PALM_prompt_3.json new file mode 100644 index 0000000000000000000000000000000000000000..7c79cb4df2515d45223316fd55eab62af55e1741 --- /dev/null +++ b/4b284b6bc4seed1/evaluation/generation/agg.4b284b6bc4seed1_GEM-web_nlg_en_PALM_prompt_3.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.5848578510766751, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.02382820842952149}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.07146406939302619, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0014453804488559735}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.3923331320425209, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.005255569174563494}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.1123642181797315, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0018086780742506458}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.03311041175360562, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.000955769810908034}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.19200440577658992, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0038021308525194295}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.05189108829034796, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0011675575856479941}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.06458792165995919, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0012821596441060375}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.35290395771176203, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004621707552330829}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.10153877113079328, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0016163226649112037}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.06707064624330737, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0013662159713619777}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.3662637426139491, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004856741037403349}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.1052784059414783, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0017096425628278053}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 3, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b6bc4seed1/evaluation/generation/agg.4b284b6bc4seed1_GEM-web_nlg_en_PALM_prompt_4.json b/4b284b6bc4seed1/evaluation/generation/agg.4b284b6bc4seed1_GEM-web_nlg_en_PALM_prompt_4.json new file mode 100644 index 0000000000000000000000000000000000000000..a6d7f848ae1ad9e48aed17a004ff4c5159143c8f --- /dev/null +++ b/4b284b6bc4seed1/evaluation/generation/agg.4b284b6bc4seed1_GEM-web_nlg_en_PALM_prompt_4.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.5815622592156788, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.029409084100340988}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.073350621026601, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0013008441046774397}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.402711193766134, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.005268855314940937}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.11600454183618039, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0017414056230866818}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.03375946119188094, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0008125358382760585}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.19912887839246102, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.003887307664703985}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.05350261302900716, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0011180842631744589}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.06666295825312767, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.001186073659230382}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.3633610895084421, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004665095807994941}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.10528355390377818, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0015840788654041859}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.06900491931707611, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0012357509964065728}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.37672100976400624, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0048637174582481756}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.10893873510925292, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0016436803370992086}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 4, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b6bc4seed1/evaluation/generation/agg.4b284b6bc4seed1_GEM-web_nlg_en_PALM_prompt_5.json b/4b284b6bc4seed1/evaluation/generation/agg.4b284b6bc4seed1_GEM-web_nlg_en_PALM_prompt_5.json new file mode 100644 index 0000000000000000000000000000000000000000..637bbb3dd9ccfe60e374bd82a9ba5c7ba1525922 --- /dev/null +++ b/4b284b6bc4seed1/evaluation/generation/agg.4b284b6bc4seed1_GEM-web_nlg_en_PALM_prompt_5.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.6292734470145089, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.032038534440523625}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.07430554120104693, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0013333669684835047}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.40910724158477596, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.005285245988912935}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.11745960029316531, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0017300682232481712}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.03448188474999599, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0008618085647059942}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.20431478176242832, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0039032533628420053}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.05452068929305587, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0011284229311503077}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.06699056196994188, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.001214766584623908}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.36652587603372083, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0046510504742824435}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.10569984600090632, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0015559332991619912}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.06952080008680515, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0012664771484443501}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.38090153422695555, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004832634454846149}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.10969123482143882, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0016247884404989854}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 5, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b6bc4seed1/evaluation/generation/agg.4b284b6bc4seed1_GEM-wiki_lingua_en_tldr_en_0.json b/4b284b6bc4seed1/evaluation/generation/agg.4b284b6bc4seed1_GEM-wiki_lingua_en_tldr_en_0.json new file mode 100644 index 0000000000000000000000000000000000000000..f15da65683654c2451eacd2af4ffb2c19ae66259 --- /dev/null +++ b/4b284b6bc4seed1/evaluation/generation/agg.4b284b6bc4seed1_GEM-wiki_lingua_en_tldr_en_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.1501551653167452, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0019145985531852103}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.2489709412710993, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.002565698467707567}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.1735899714732908, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0018379295907133386}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.030202594861558258, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.000759198757195269}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.05179351194647759, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0013706134138774457}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.03527159968688606, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.000856000364522866}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.11587674124907248, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0013578078418251586}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.19905321222991249, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002072708736632529}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.13542458385119363, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0013094512830872681}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.13806383555422214, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0017411900348176868}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.23066945559291627, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0023890574843587445}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.15998195547427285, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0016735883778822192}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 1.4638786550080012, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.08267943817716743}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b6bc4seed1/evaluation/generation/agg.4b284b6bc4seed1_GEM-wiki_lingua_en_tldr_en_1.json b/4b284b6bc4seed1/evaluation/generation/agg.4b284b6bc4seed1_GEM-wiki_lingua_en_tldr_en_1.json new file mode 100644 index 0000000000000000000000000000000000000000..9e82c560009613d13bf2d7805b9e02054b4a846f --- /dev/null +++ b/4b284b6bc4seed1/evaluation/generation/agg.4b284b6bc4seed1_GEM-wiki_lingua_en_tldr_en_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.17561493820630653, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.002048580212979638}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.2975242805713054, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.002661646132459767}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.20517386588028216, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0019096420138433956}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.038705255482649484, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0008641576645556467}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.06721747132871511, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0015546205463413934}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.04509174855817, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0009362703351931108}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.12348273344528769, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0013241963423884194}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.2182708873208918, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002078335701646665}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.1461985663690308, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0012629826687957297}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.16411787830700947, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.001905726984632049}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.2793462022470309, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.00252183230288639}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.19199261777381824, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0017768312743395834}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 2.251037388830426, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.06386416803226096}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b6bc4seed1/evaluation/generation/agg.4b284b6bc4seed1_GEM-wiki_lingua_en_tldr_en_2.json b/4b284b6bc4seed1/evaluation/generation/agg.4b284b6bc4seed1_GEM-wiki_lingua_en_tldr_en_2.json new file mode 100644 index 0000000000000000000000000000000000000000..e4a50c7b0609d8efa4390c1eeb753a857868e013 --- /dev/null +++ b/4b284b6bc4seed1/evaluation/generation/agg.4b284b6bc4seed1_GEM-wiki_lingua_en_tldr_en_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.18279672864000174, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.001990030228234584}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.31492793105361294, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0025616011512098248}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.2149553929096824, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0018159340053845016}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.042646009741889805, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0008649264691986515}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.07496946538732863, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0015594180926328848}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.050099922234849326, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0009396332686045797}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.12807089612938685, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0013124423288503014}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.22896480825128132, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0020362817656302}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.152189270942713, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0012132534448735604}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.1719794802172194, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0018519473657900671}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.29789003880343934, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.002450408388704567}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.20261963860140034, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.001699260136326749}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 2.638972923238051, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.04079081483713292}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b6bc4seed1/evaluation/generation/agg.4b284b6bc4seed1_GEM-wiki_lingua_en_tldr_en_3.json b/4b284b6bc4seed1/evaluation/generation/agg.4b284b6bc4seed1_GEM-wiki_lingua_en_tldr_en_3.json new file mode 100644 index 0000000000000000000000000000000000000000..6273fe14cda2c9b5c571c0e1c122ddc41f1ed913 --- /dev/null +++ b/4b284b6bc4seed1/evaluation/generation/agg.4b284b6bc4seed1_GEM-wiki_lingua_en_tldr_en_3.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.15880336071647017, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0022944434654695485}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.26506418569211093, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0032637292322135534}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.1811722525980339, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0022088859505497234}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.0374298998336526, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0009347509198517388}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.06524543251395427, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.001603994023546246}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.04316445582714641, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.000956046878850861}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.11189815593178445, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.001600964481991733}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.1930856830862472, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0025117226250944077}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.12842259890093402, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0015101623900602265}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.14949474498482374, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0021540706302144844}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.2508189749530171, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0031145852012745777}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.1708671620256238, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0020803868308500607}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 2.7817782152958124, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.04494580041852014}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 3, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b6bc4seed1/evaluation/generation/agg.4b284b6bc4seed1_GEM-wiki_lingua_en_tldr_en_4.json b/4b284b6bc4seed1/evaluation/generation/agg.4b284b6bc4seed1_GEM-wiki_lingua_en_tldr_en_4.json new file mode 100644 index 0000000000000000000000000000000000000000..591924d9215b829a18e6b9cb520f763c0ba3b489 --- /dev/null +++ b/4b284b6bc4seed1/evaluation/generation/agg.4b284b6bc4seed1_GEM-wiki_lingua_en_tldr_en_4.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.0526082191649819, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0019579711254660813}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.08887123055545011, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.002973119831747629}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.058148219500646206, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0019439260562197995}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.012404560376357416, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.000765615351847643}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.021336430842142755, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.001118116808651589}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.013391403283503953, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0006305028420949355}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.038334561197559465, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.001465640058040743}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.06619947973463458, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0022604433031636296}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.042154106197481285, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.001383034127114084}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.049466020968478554, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0018544231085558262}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.08334408075199987, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.002792361572274234}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.05448171126882292, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0018181715140947877}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 0.5997291080192819, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.034966523246928005}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 4, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b6bc4seed1/evaluation/generation/agg.4b284b6bc4seed1_GEM-wiki_lingua_en_tldr_en_5.json b/4b284b6bc4seed1/evaluation/generation/agg.4b284b6bc4seed1_GEM-wiki_lingua_en_tldr_en_5.json new file mode 100644 index 0000000000000000000000000000000000000000..cabe9729fd7f0be18bd9d047962489531667dd2a --- /dev/null +++ b/4b284b6bc4seed1/evaluation/generation/agg.4b284b6bc4seed1_GEM-wiki_lingua_en_tldr_en_5.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.00828795189621696, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0008084030145764894}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.013904833680136126, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0013152248622154829}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.009101109725055801, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.000849061484627802}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.0017579778442265573, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.00022272256203822104}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.0034824583016457547, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0004707745855497479}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.0021173402290246453, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0002651969883574264}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.00606164612301448, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0005820824170547412}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.010516775330575035, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0010286453150278683}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.006671364196388791, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0006155682683130244}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.0077547689033896795, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0007519757597042171}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.013113865139552568, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0012437323588959986}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.00852403124177262, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.000789483822967171}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 1.0320053783861012e-06, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 1.6548309745966328e-06}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 5, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b6bc4seed1/evaluation/generation/agg.4b284b6bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_0.json b/4b284b6bc4seed1/evaluation/generation/agg.4b284b6bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_0.json new file mode 100644 index 0000000000000000000000000000000000000000..ad6ad7a09c5dea37037bddceeeb77a03f0e2d6ed --- /dev/null +++ b/4b284b6bc4seed1/evaluation/generation/agg.4b284b6bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 1.4456822172834254, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.04276533070237041}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.08084608817477075, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0013037630358869862}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.16055476672730024, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0022564902307428436}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.10550747830492155, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.001600046418184004}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.0180883910143694, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0006324971623061661}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.03352985411112681, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0011860257734223087}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.023111704860364103, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0008023451007582199}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.07897160421844947, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0012157586325601468}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.15704150708399545, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0020880518954252106}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.10309579699961463, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0014856345287328617}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.06566532991903784, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.00115593325264158}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.13043930012149813, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0020438483091751833}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.085687119444743, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0014326281774339593}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b6bc4seed1/evaluation/generation/agg.4b284b6bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_1.json b/4b284b6bc4seed1/evaluation/generation/agg.4b284b6bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_1.json new file mode 100644 index 0000000000000000000000000000000000000000..adee0249cba407f453562ca58b075cc497342b11 --- /dev/null +++ b/4b284b6bc4seed1/evaluation/generation/agg.4b284b6bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 7.854550343569453, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.11842361375802873}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.35242925608961834, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0025862879156174677}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.4593871286009479, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0027718307444898073}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.37960517377654424, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0021312179107678742}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.15016846460595357, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0016925643088238768}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.1987661075234813, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.002085741403395336}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.16225548525605324, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.001628980531143478}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.2535878033618753, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0018603284522068176}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.3373488751020238, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0023042860742874356}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.2751099734003478, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0015986731793980245}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.2947167761956799, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.002321783937504011}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.3850310566251188, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0026364808102144186}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.31764028681903844, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0020166639615139246}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b6bc4seed1/evaluation/generation/agg.4b284b6bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_2.json b/4b284b6bc4seed1/evaluation/generation/agg.4b284b6bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_2.json new file mode 100644 index 0000000000000000000000000000000000000000..4f0383c0fdfee2a29366c0cc70b2a60c94dffde3 --- /dev/null +++ b/4b284b6bc4seed1/evaluation/generation/agg.4b284b6bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 10.584259500465588, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.1544206935916045}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.4101598697462684, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.002246311055501821}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.4603951235406536, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.002736343584240638}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.41716631446436636, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.001904443983975073}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.1817762545465421, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0017054003975476711}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.20814546072005263, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0021073018090344247}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.18592733733343356, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.001651511887316203}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.29271400984628115, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0018520206075962242}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.3307167069836982, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002352222065176941}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.29825905325627894, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0016671912167031061}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.3438330605735075, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0021559258341024025}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.3863382687718853, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0026264477519150294}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.3497622641102556, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0019222555310956092}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b6bc4seed1/evaluation/generation/agg.4b284b6bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_3.json b/4b284b6bc4seed1/evaluation/generation/agg.4b284b6bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_3.json new file mode 100644 index 0000000000000000000000000000000000000000..4f55b68bbc2357de217d9187edc70bcaa3db6327 --- /dev/null +++ b/4b284b6bc4seed1/evaluation/generation/agg.4b284b6bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_3.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 11.005027804713954, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.14913713325107694}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.4128283610854264, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.00218582649540743}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.4617654209580726, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0027204559282358}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.4199469764935773, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.001866102905923008}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.18554586275444523, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0017040263392683272}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.2117021500635163, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.002152756842715476}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.18965165207657023, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0016611244058807987}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.29313420912472204, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0018337994526123047}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.32931921594254, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0023370831957328685}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.298413421066599, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0016514441907895666}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.34697556096050464, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.002097945215373547}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.3888925774714783, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.002615178055125266}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.3531127839068146, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0018773997153010787}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 3, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b6bc4seed1/evaluation/generation/agg.4b284b6bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_4.json b/4b284b6bc4seed1/evaluation/generation/agg.4b284b6bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_4.json new file mode 100644 index 0000000000000000000000000000000000000000..695f806162fe397539e67854089cf205d8e84b46 --- /dev/null +++ b/4b284b6bc4seed1/evaluation/generation/agg.4b284b6bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_4.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 11.363725115618854, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.1349892134607558}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.41369428294464894, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0022630498681273214}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.463073205676912, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.002620101280268744}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.4214008037563902, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0018957274669436463}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.18853767720104403, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0017966301373649335}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.21376292605494995, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0021133996361269876}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.19224882966800977, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.001688941669379114}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.2947773213194346, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0019453260402410404}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.33160719324501514, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0023386028746102032}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.30045503720645306, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0017243402211031724}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.34793871661300624, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0022022816802554548}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.38987225844490936, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0025624343675698957}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.35440044254437, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.001939185206150459}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 4, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b6bc4seed1/evaluation/generation/agg.4b284b6bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_5.json b/4b284b6bc4seed1/evaluation/generation/agg.4b284b6bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_5.json new file mode 100644 index 0000000000000000000000000000000000000000..0bc7eeb2f7074cb26c18dc7a25dee181608cbc0a --- /dev/null +++ b/4b284b6bc4seed1/evaluation/generation/agg.4b284b6bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_5.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 11.396192996497414, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.16654357094855035}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.415343404582103, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0022395714603746343}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.462339881403203, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.002606515070610007}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.42256346127489886, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0018711992463432423}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.18874947831873545, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0017363983679664929}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.21329100699058842, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0020862831128997342}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.19258472578075223, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0016595774845375585}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.29366555957532514, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0018624351126946828}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.32911404216108797, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0023155754665530786}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.29935707532452077, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0016828692465751755}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.34963846222070455, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0021787598409919178}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.3890874281204962, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0025265070175629857}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.3555436949251867, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0019127831146169912}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 5, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b6bc4seed1/evaluation/generation/agg.4b284b6bc4seed1_gem_xsum_article_DOC_summary_0.json b/4b284b6bc4seed1/evaluation/generation/agg.4b284b6bc4seed1_gem_xsum_article_DOC_summary_0.json new file mode 100644 index 0000000000000000000000000000000000000000..a5992282166cb5b45db8f70f2ecf6a782712e255 --- /dev/null +++ b/4b284b6bc4seed1/evaluation/generation/agg.4b284b6bc4seed1_gem_xsum_article_DOC_summary_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.15422621570346934, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0020039005936603317}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.3506635490563916, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0042556493547655115}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.20889878659689404, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002458161766680771}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.03307990095257621, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0011002276404168225}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.07910944220650014, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0026293603468150466}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.04565942952067972, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.001484562672483921}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.11490133308951496, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.001481297426684668}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.26284399370938016, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0033084414512192374}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.15587034501708355, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0018431637093872144}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.12158807333409381, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0016089880194761488}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.278789316707468, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.00364738944247525}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.1651849748571103, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.002039061494531475}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 1.8234981410881652, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.09861688194525574}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b6bc4seed1/evaluation/generation/agg.4b284b6bc4seed1_gem_xsum_article_DOC_summary_1.json b/4b284b6bc4seed1/evaluation/generation/agg.4b284b6bc4seed1_gem_xsum_article_DOC_summary_1.json new file mode 100644 index 0000000000000000000000000000000000000000..f4d26b5d76a027c6d9fe00bc68644b184b0ed435 --- /dev/null +++ b/4b284b6bc4seed1/evaluation/generation/agg.4b284b6bc4seed1_gem_xsum_article_DOC_summary_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.12978400090119854, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0018214048412026733}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.32027413224988105, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.00416743115408514}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.18254418171842912, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0024443411491113813}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.025920284045820686, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0009915583067368265}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.06631766447507839, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0026016286386155744}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.036825241144522146, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0014067669670603119}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.09779168145477703, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0013336831707437397}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.24393449987832236, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0032690620169295624}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.1379121041144307, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0018159806506780998}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.10419708360998835, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0014908021891115058}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.2591470200293115, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0035902088886349626}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.14685271867556554, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.00202786402481471}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 1.4511145888771138, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.09215852910549645}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b6bc4seed1/evaluation/generation/agg.4b284b6bc4seed1_gem_xsum_article_DOC_summary_2.json b/4b284b6bc4seed1/evaluation/generation/agg.4b284b6bc4seed1_gem_xsum_article_DOC_summary_2.json new file mode 100644 index 0000000000000000000000000000000000000000..614aae411d2da4aaa2e2b1616c708486de1d8593 --- /dev/null +++ b/4b284b6bc4seed1/evaluation/generation/agg.4b284b6bc4seed1_gem_xsum_article_DOC_summary_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.12682893488466288, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0018115124386976255}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.3129238773710033, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004144317584991236}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.1784133650153775, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002434527345664647}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.023792739813654398, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0009538695469598671}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.060628286518002124, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.002544171640335871}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.03377646994942601, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0013577113683580135}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.09538132852222156, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0012844315555328582}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.23736904076265325, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0031180197306729797}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.13445676544883162, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.001742983161792639}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.10150079343006048, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0014805542361053387}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.25224041568358746, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.00356325287772434}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.14302327166537732, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0020121565752601223}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 1.4173910716715976, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.1269050055569669}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b6bc4seed1/evaluation/generation/agg.4b284b6bc4seed1_gem_xsum_article_DOC_summary_3.json b/4b284b6bc4seed1/evaluation/generation/agg.4b284b6bc4seed1_gem_xsum_article_DOC_summary_3.json new file mode 100644 index 0000000000000000000000000000000000000000..20650cbe735115dc3980448f5e0d4f526409b65e --- /dev/null +++ b/4b284b6bc4seed1/evaluation/generation/agg.4b284b6bc4seed1_gem_xsum_article_DOC_summary_3.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.12682835665999379, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.00213008962319155}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.3009777871605996, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0045155564803296844}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.17405000505151677, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0026158795444079694}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.02441534481786468, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0010675183688113013}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.060023335309239284, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0025544641047680868}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.03375564198727498, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0014032677780195426}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.09672846502785581, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.001605939754348312}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.23129794905638065, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.003504325859643222}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.13287002402660542, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0019574198182001363}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.10242219504173285, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0017649678079630277}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.2447872835150151, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0038950725453768833}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.14072796227018858, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.002188698179032325}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 1.4410854543220795, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.11065939978206533}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 3, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b6bc4seed1/evaluation/generation/agg.4b284b6bc4seed1_gem_xsum_article_DOC_summary_4.json b/4b284b6bc4seed1/evaluation/generation/agg.4b284b6bc4seed1_gem_xsum_article_DOC_summary_4.json new file mode 100644 index 0000000000000000000000000000000000000000..0d725fff15d0a1ae8085a42c714827083bd97538 --- /dev/null +++ b/4b284b6bc4seed1/evaluation/generation/agg.4b284b6bc4seed1_gem_xsum_article_DOC_summary_4.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.041064589753945765, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.002574722440175742}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.07375404829054749, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004261542973214119}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.046992144100321806, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002618786666967082}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.0072827259137400735, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0008839873299209189}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.01434569739075993, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0014362041655696376}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.008636963128827568, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0008391846215142884}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.03137075485796663, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0020006363883442293}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.05624031413634613, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0032626943561910897}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.03548036137516894, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.001955807555849124}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.03357423627999912, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0021310282339018806}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.059996937228044826, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.003508594344969223}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.03810619457684465, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0021359009016179383}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 0.6753547790268645, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.09678811316166971}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 4, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b6bc4seed1/evaluation/generation/agg.4b284b6bc4seed1_gem_xsum_article_DOC_summary_5.json b/4b284b6bc4seed1/evaluation/generation/agg.4b284b6bc4seed1_gem_xsum_article_DOC_summary_5.json new file mode 100644 index 0000000000000000000000000000000000000000..dbfb99544cd5d94ffd708251f8f40b36a9e4f9a2 --- /dev/null +++ b/4b284b6bc4seed1/evaluation/generation/agg.4b284b6bc4seed1_gem_xsum_article_DOC_summary_5.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.002394598265414318, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0007029813930147865}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.0019954716710551207, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0005584193559240988}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.0021338767527660316, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.000606716788713842}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.0001469327010392493, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 8.511648046715374e-05}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.00010241330996047977, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 5.9726635104036084e-05}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.00011901404509555748, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 6.872962972148577e-05}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.0017715789785566055, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0005103213321970242}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.0015030111824248839, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0004165975224565321}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.0015909130557671355, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0004446509241590643}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.0020245246393824, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0006015169025391406}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.0016826910638698292, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0004718028635824783}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.001799689332800904, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0005143272355042585}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 3.8720991740133824e-38, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 6.757775100349013e-33}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 5, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b6bc4seed1/evaluation/generation/examples.4b284b6bc4seed1_GEM-web_nlg_en_PALM_prompt_0.jsonl b/4b284b6bc4seed1/evaluation/generation/examples.4b284b6bc4seed1_GEM-web_nlg_en_PALM_prompt_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..e40f07d7ffba0ff6ff1c7efbb4c07c1621586395 --- /dev/null +++ b/4b284b6bc4seed1/evaluation/generation/examples.4b284b6bc4seed1_GEM-web_nlg_en_PALM_prompt_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d9f4461888b0786968e04a53e66c8d83fa848f70aedbdb8813943aeff15ab462 +size 4135392 diff --git a/4b284b6bc4seed1/evaluation/generation/examples.4b284b6bc4seed1_GEM-web_nlg_en_PALM_prompt_1.jsonl b/4b284b6bc4seed1/evaluation/generation/examples.4b284b6bc4seed1_GEM-web_nlg_en_PALM_prompt_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..6c7a827340725f0649490db5accf92668122b112 --- /dev/null +++ b/4b284b6bc4seed1/evaluation/generation/examples.4b284b6bc4seed1_GEM-web_nlg_en_PALM_prompt_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7b97101fde5af27cd6a2a28b53aaa581c05301f35c31b502b36d2738a308879a +size 5210086 diff --git a/4b284b6bc4seed1/evaluation/generation/examples.4b284b6bc4seed1_GEM-web_nlg_en_PALM_prompt_2.jsonl b/4b284b6bc4seed1/evaluation/generation/examples.4b284b6bc4seed1_GEM-web_nlg_en_PALM_prompt_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..0008e23071f77ea8f5c183e71fef139836d2e32d --- /dev/null +++ b/4b284b6bc4seed1/evaluation/generation/examples.4b284b6bc4seed1_GEM-web_nlg_en_PALM_prompt_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:41fb511065f37bbcb1b5f2c1d604fac8b1cb94fc426b3b9d3a57c8dd7a8d9d06 +size 6093771 diff --git a/4b284b6bc4seed1/evaluation/generation/examples.4b284b6bc4seed1_GEM-web_nlg_en_PALM_prompt_3.jsonl b/4b284b6bc4seed1/evaluation/generation/examples.4b284b6bc4seed1_GEM-web_nlg_en_PALM_prompt_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..a4616e7602f1fa9bc6571331780fdfa77dd9bc37 --- /dev/null +++ b/4b284b6bc4seed1/evaluation/generation/examples.4b284b6bc4seed1_GEM-web_nlg_en_PALM_prompt_3.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f07899f01d991dda37755fd5079c2e2e1bbab743ea9cffd34e0cbce8acb54728 +size 7006046 diff --git a/4b284b6bc4seed1/evaluation/generation/examples.4b284b6bc4seed1_GEM-web_nlg_en_PALM_prompt_4.jsonl b/4b284b6bc4seed1/evaluation/generation/examples.4b284b6bc4seed1_GEM-web_nlg_en_PALM_prompt_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..4829533e812e3e699c01e1d32ccc2171640ce5e0 --- /dev/null +++ b/4b284b6bc4seed1/evaluation/generation/examples.4b284b6bc4seed1_GEM-web_nlg_en_PALM_prompt_4.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:60b25ae5fe65910ae46c15f2f93f988bb4f801174db5020714e17c488a1cdbc2 +size 7899695 diff --git a/4b284b6bc4seed1/evaluation/generation/examples.4b284b6bc4seed1_GEM-web_nlg_en_PALM_prompt_5.jsonl b/4b284b6bc4seed1/evaluation/generation/examples.4b284b6bc4seed1_GEM-web_nlg_en_PALM_prompt_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..def1b4322c7c275c4357d2105b059cc79cb62b60 --- /dev/null +++ b/4b284b6bc4seed1/evaluation/generation/examples.4b284b6bc4seed1_GEM-web_nlg_en_PALM_prompt_5.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:651fc41d3388fb6d2503c0435d0c1a89abf4d9e49a6f90d4fdda86d5315586d7 +size 8793943 diff --git a/4b284b6bc4seed1/evaluation/generation/examples.4b284b6bc4seed1_GEM-wiki_lingua_en_tldr_en_0.jsonl b/4b284b6bc4seed1/evaluation/generation/examples.4b284b6bc4seed1_GEM-wiki_lingua_en_tldr_en_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..76dbd0b55e5e9e66f7c1332f7b50d943bd3d09da --- /dev/null +++ b/4b284b6bc4seed1/evaluation/generation/examples.4b284b6bc4seed1_GEM-wiki_lingua_en_tldr_en_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e33a70bcacb3ebc379b981c08791df2b581e89d66ba7ae375da336042b9d5cc +size 7684227 diff --git a/4b284b6bc4seed1/evaluation/generation/examples.4b284b6bc4seed1_GEM-wiki_lingua_en_tldr_en_1.jsonl b/4b284b6bc4seed1/evaluation/generation/examples.4b284b6bc4seed1_GEM-wiki_lingua_en_tldr_en_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..bad9778848c4fbc01072f376ed23bab4580f5864 --- /dev/null +++ b/4b284b6bc4seed1/evaluation/generation/examples.4b284b6bc4seed1_GEM-wiki_lingua_en_tldr_en_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:265c9b0014ce281daff607674788b9f6600152ea8cda8118f829293d9428052c +size 13326356 diff --git a/4b284b6bc4seed1/evaluation/generation/examples.4b284b6bc4seed1_GEM-wiki_lingua_en_tldr_en_2.jsonl b/4b284b6bc4seed1/evaluation/generation/examples.4b284b6bc4seed1_GEM-wiki_lingua_en_tldr_en_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..c4b09ea0457e269fc263264a31e388b8b14ac290 --- /dev/null +++ b/4b284b6bc4seed1/evaluation/generation/examples.4b284b6bc4seed1_GEM-wiki_lingua_en_tldr_en_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e9d738828e4fa8d4faec595795d4dfc708fa02cbfceb3e486be4c5a2caf75ad +size 18929635 diff --git a/4b284b6bc4seed1/evaluation/generation/examples.4b284b6bc4seed1_GEM-wiki_lingua_en_tldr_en_3.jsonl b/4b284b6bc4seed1/evaluation/generation/examples.4b284b6bc4seed1_GEM-wiki_lingua_en_tldr_en_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..6c3c724c89598aa7e2d7957c508ea7c7390415f7 --- /dev/null +++ b/4b284b6bc4seed1/evaluation/generation/examples.4b284b6bc4seed1_GEM-wiki_lingua_en_tldr_en_3.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:09313549f646feb5f69ccd34772f3bc45c2b44ea1e83ffec80231633134b8098 +size 24348447 diff --git a/4b284b6bc4seed1/evaluation/generation/examples.4b284b6bc4seed1_GEM-wiki_lingua_en_tldr_en_4.jsonl b/4b284b6bc4seed1/evaluation/generation/examples.4b284b6bc4seed1_GEM-wiki_lingua_en_tldr_en_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..60f5901a65233ba90a7b631409b06ae876546ecd --- /dev/null +++ b/4b284b6bc4seed1/evaluation/generation/examples.4b284b6bc4seed1_GEM-wiki_lingua_en_tldr_en_4.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:354e1a737d37a49cc971eb7307088a1ea8327b39808dcc8bf92fbb7f77df038c +size 29479617 diff --git a/4b284b6bc4seed1/evaluation/generation/examples.4b284b6bc4seed1_GEM-wiki_lingua_en_tldr_en_5.jsonl b/4b284b6bc4seed1/evaluation/generation/examples.4b284b6bc4seed1_GEM-wiki_lingua_en_tldr_en_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..86fc27c02d3936f107d3157fb90b70b3c9990661 --- /dev/null +++ b/4b284b6bc4seed1/evaluation/generation/examples.4b284b6bc4seed1_GEM-wiki_lingua_en_tldr_en_5.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e25d2b0203e86a29f1e36fd8d091ec096026da31da8061141543d97f82cb985b +size 34801261 diff --git a/4b284b6bc4seed1/evaluation/generation/examples.4b284b6bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl b/4b284b6bc4seed1/evaluation/generation/examples.4b284b6bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..e002ea1e24aab527cc82df661070fcea9e597cdb --- /dev/null +++ b/4b284b6bc4seed1/evaluation/generation/examples.4b284b6bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:530f45997fdbb48a801b8c75050bb3e2ce869d116f0fb54c11b2f49e3f7cf2e4 +size 4412187 diff --git a/4b284b6bc4seed1/evaluation/generation/examples.4b284b6bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl b/4b284b6bc4seed1/evaluation/generation/examples.4b284b6bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..90a03dc105c8b53275bbd742f7022e8a9a04e2b3 --- /dev/null +++ b/4b284b6bc4seed1/evaluation/generation/examples.4b284b6bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b0777d6d3d083621872b1834fb34d9d65e749d930659df2ec0ff56886f2acb00 +size 5289642 diff --git a/4b284b6bc4seed1/evaluation/generation/examples.4b284b6bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl b/4b284b6bc4seed1/evaluation/generation/examples.4b284b6bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..f26b2b22ba31c01eda41f46d26df0b267450f828 --- /dev/null +++ b/4b284b6bc4seed1/evaluation/generation/examples.4b284b6bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:81b26e3c152da7bea7c0e186a88798b341d8fb862898d238bcf7cbba3cf3d97d +size 6258617 diff --git a/4b284b6bc4seed1/evaluation/generation/examples.4b284b6bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl b/4b284b6bc4seed1/evaluation/generation/examples.4b284b6bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..69da8208d030c9e37b88d865e6a421f4382eeffa --- /dev/null +++ b/4b284b6bc4seed1/evaluation/generation/examples.4b284b6bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1addbfc267b2c55a24afcbfcdd7aeca553d8b78617ebdbcfbc27561cd8d49f4e +size 7337025 diff --git a/4b284b6bc4seed1/evaluation/generation/examples.4b284b6bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl b/4b284b6bc4seed1/evaluation/generation/examples.4b284b6bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..11151f6cb7eded291396d6aa3b4a3ec5860c61c0 --- /dev/null +++ b/4b284b6bc4seed1/evaluation/generation/examples.4b284b6bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:53e4e61c3275a7657cfc6c0cc986da54cb797082612135e7b2b4032d4185e7de +size 8419972 diff --git a/4b284b6bc4seed1/evaluation/generation/examples.4b284b6bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl b/4b284b6bc4seed1/evaluation/generation/examples.4b284b6bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..c611baa0d645460b21281ef94dff79171dd82f2d --- /dev/null +++ b/4b284b6bc4seed1/evaluation/generation/examples.4b284b6bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:390a81384aa348664fb403912e8ff7609104d6cd12bbdfcca289b90e9b0c01a1 +size 9501237 diff --git a/4b284b6bc4seed1/evaluation/generation/examples.4b284b6bc4seed1_gem_xsum_article_DOC_summary_0.jsonl b/4b284b6bc4seed1/evaluation/generation/examples.4b284b6bc4seed1_gem_xsum_article_DOC_summary_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..835c079738c331105e0a0578203b58de572607cf --- /dev/null +++ b/4b284b6bc4seed1/evaluation/generation/examples.4b284b6bc4seed1_gem_xsum_article_DOC_summary_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5b83f652c0bb2052afd20c5dc0771f5c65486178eb3cb56e4fed8ca50b496ec2 +size 2820789 diff --git a/4b284b6bc4seed1/evaluation/generation/examples.4b284b6bc4seed1_gem_xsum_article_DOC_summary_1.jsonl b/4b284b6bc4seed1/evaluation/generation/examples.4b284b6bc4seed1_gem_xsum_article_DOC_summary_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..7d12ac0de9f72f1524d155af004e95ef1346f3bc --- /dev/null +++ b/4b284b6bc4seed1/evaluation/generation/examples.4b284b6bc4seed1_gem_xsum_article_DOC_summary_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e7cacc9cc7e4fb91d18f2f74881b8bd499cf9f2aae74abf117a7a750ecc1236d +size 5104268 diff --git a/4b284b6bc4seed1/evaluation/generation/examples.4b284b6bc4seed1_gem_xsum_article_DOC_summary_2.jsonl b/4b284b6bc4seed1/evaluation/generation/examples.4b284b6bc4seed1_gem_xsum_article_DOC_summary_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..d91e3032a65e6a736a99a298a11362798282f0aa --- /dev/null +++ b/4b284b6bc4seed1/evaluation/generation/examples.4b284b6bc4seed1_gem_xsum_article_DOC_summary_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2dae945d28ec7e918618b994c79f809023a065e2c13634829b1539171c53407e +size 7378145 diff --git a/4b284b6bc4seed1/evaluation/generation/examples.4b284b6bc4seed1_gem_xsum_article_DOC_summary_3.jsonl b/4b284b6bc4seed1/evaluation/generation/examples.4b284b6bc4seed1_gem_xsum_article_DOC_summary_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..320ca820904c5811463abb3feedc2f7f61d2aef3 --- /dev/null +++ b/4b284b6bc4seed1/evaluation/generation/examples.4b284b6bc4seed1_gem_xsum_article_DOC_summary_3.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d43016945991573797a32e4b8afc3b471aa655bc46b260f966069d91e2ad1ab4 +size 9645695 diff --git a/4b284b6bc4seed1/evaluation/generation/examples.4b284b6bc4seed1_gem_xsum_article_DOC_summary_4.jsonl b/4b284b6bc4seed1/evaluation/generation/examples.4b284b6bc4seed1_gem_xsum_article_DOC_summary_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..169ffdb532b31a263e6f111b1b3ea73174fd1030 --- /dev/null +++ b/4b284b6bc4seed1/evaluation/generation/examples.4b284b6bc4seed1_gem_xsum_article_DOC_summary_4.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:44c51f6ff3a2e640fac697865392430aa72cadf8a155bb171d0d46a8ea1521fe +size 11671629 diff --git a/4b284b6bc4seed1/evaluation/generation/examples.4b284b6bc4seed1_gem_xsum_article_DOC_summary_5.jsonl b/4b284b6bc4seed1/evaluation/generation/examples.4b284b6bc4seed1_gem_xsum_article_DOC_summary_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..cbbcd2c241af95eb9ba7525366998e46748445e3 --- /dev/null +++ b/4b284b6bc4seed1/evaluation/generation/examples.4b284b6bc4seed1_gem_xsum_article_DOC_summary_5.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2e903ed9af37a17db873227e84295e921bb4b952d7f471b464f77e183de18235 +size 13897551 diff --git a/4b284b6bc4seed1/evaluation/generation/merged.csv b/4b284b6bc4seed1/evaluation/generation/merged.csv new file mode 100644 index 0000000000000000000000000000000000000000..b61feb8e2cb7cafc5dd3e24d5271c6eb0d4c95a8 --- /dev/null +++ b/4b284b6bc4seed1/evaluation/generation/merged.csv @@ -0,0 +1,53 @@ +dataset,fewshots,prompt,metric,value +e2e_nlg_cleaned,0,generate_text_restaurant,rouge2_fmeasure,0.023111704860364103 +e2e_nlg_cleaned,0,median,rouge2_fmeasure,0.023111704860364103 +e2e_nlg_cleaned,1,generate_text_restaurant,rouge2_fmeasure,0.16225548525605324 +e2e_nlg_cleaned,1,median,rouge2_fmeasure,0.16225548525605324 +e2e_nlg_cleaned,2,generate_text_restaurant,rouge2_fmeasure,0.18592733733343356 +e2e_nlg_cleaned,2,median,rouge2_fmeasure,0.18592733733343356 +e2e_nlg_cleaned,3,generate_text_restaurant,rouge2_fmeasure,0.18965165207657023 +e2e_nlg_cleaned,3,median,rouge2_fmeasure,0.18965165207657023 +e2e_nlg_cleaned,4,generate_text_restaurant,rouge2_fmeasure,0.19224882966800977 +e2e_nlg_cleaned,4,median,rouge2_fmeasure,0.19224882966800977 +e2e_nlg_cleaned,5,generate_text_restaurant,rouge2_fmeasure,0.19258472578075223 +e2e_nlg_cleaned,5,median,rouge2_fmeasure,0.19258472578075223 +e2e_nlg_cleaned,5,average,multiple,0.1576299558291972 +gem_xsum,0,article_DOC_summary,rouge2_fmeasure,0.04565942952067972 +gem_xsum,0,median,rouge2_fmeasure,0.04565942952067972 +gem_xsum,1,article_DOC_summary,rouge2_fmeasure,0.036825241144522146 +gem_xsum,1,median,rouge2_fmeasure,0.036825241144522146 +gem_xsum,2,article_DOC_summary,rouge2_fmeasure,0.03377646994942601 +gem_xsum,2,median,rouge2_fmeasure,0.03377646994942601 +gem_xsum,3,article_DOC_summary,rouge2_fmeasure,0.03375564198727498 +gem_xsum,3,median,rouge2_fmeasure,0.03375564198727498 +gem_xsum,4,article_DOC_summary,rouge2_fmeasure,0.008636963128827568 +gem_xsum,4,median,rouge2_fmeasure,0.008636963128827568 +gem_xsum,5,article_DOC_summary,rouge2_fmeasure,0.00011901404509555748 +gem_xsum,5,median,rouge2_fmeasure,0.00011901404509555748 +gem_xsum,5,average,multiple,0.02646212662930433 +web_nlg_en,0,PALM_prompt,rouge2_fmeasure,0.05038765662771961 +web_nlg_en,0,median,rouge2_fmeasure,0.05038765662771961 +web_nlg_en,1,PALM_prompt,rouge2_fmeasure,0.04600863612485982 +web_nlg_en,1,median,rouge2_fmeasure,0.04600863612485982 +web_nlg_en,2,PALM_prompt,rouge2_fmeasure,0.050112452100538586 +web_nlg_en,2,median,rouge2_fmeasure,0.050112452100538586 +web_nlg_en,3,PALM_prompt,rouge2_fmeasure,0.05189108829034796 +web_nlg_en,3,median,rouge2_fmeasure,0.05189108829034796 +web_nlg_en,4,PALM_prompt,rouge2_fmeasure,0.05350261302900716 +web_nlg_en,4,median,rouge2_fmeasure,0.05350261302900716 +web_nlg_en,5,PALM_prompt,rouge2_fmeasure,0.05452068929305587 +web_nlg_en,5,median,rouge2_fmeasure,0.05452068929305587 +web_nlg_en,5,average,multiple,0.051070522577588165 +wiki_lingua_en,0,tldr_en,rouge2_fmeasure,0.03527159968688606 +wiki_lingua_en,0,median,rouge2_fmeasure,0.03527159968688606 +wiki_lingua_en,1,tldr_en,rouge2_fmeasure,0.04509174855817 +wiki_lingua_en,1,median,rouge2_fmeasure,0.04509174855817 +wiki_lingua_en,2,tldr_en,rouge2_fmeasure,0.050099922234849326 +wiki_lingua_en,2,median,rouge2_fmeasure,0.050099922234849326 +wiki_lingua_en,3,tldr_en,rouge2_fmeasure,0.04316445582714641 +wiki_lingua_en,3,median,rouge2_fmeasure,0.04316445582714641 +wiki_lingua_en,4,tldr_en,rouge2_fmeasure,0.013391403283503953 +wiki_lingua_en,4,median,rouge2_fmeasure,0.013391403283503953 +wiki_lingua_en,5,tldr_en,rouge2_fmeasure,0.0021173402290246453 +wiki_lingua_en,5,median,rouge2_fmeasure,0.0021173402290246453 +wiki_lingua_en,5,average,multiple,0.031522744969930065 diff --git a/4b284b6bc4seed1/evaluation/generation/merged.json b/4b284b6bc4seed1/evaluation/generation/merged.json new file mode 100644 index 0000000000000000000000000000000000000000..9d49b18e9d6a3c3919262382b1571b5771ac9ee6 --- /dev/null +++ b/4b284b6bc4seed1/evaluation/generation/merged.json @@ -0,0 +1 @@ +{"GEM/web_nlg_en": {"0": {"PALM_prompt": {"bleu": 0.34350884519310554, "bleu_stderr": 0.038772150149038065, "rouge1_fmeasure": 0.10544276754647447, "rouge1_fmeasure_stderr": 0.0021544893348497355, "rouge1_precision": 0.07173003966213615, "rouge1_precision_stderr": 0.001891427473975356, "rouge1_recall": 0.28960101855358183, "rouge1_recall_stderr": 0.004686243089174828, "rouge2_fmeasure": 0.05038765662771961, "rouge2_fmeasure_stderr": 0.0013708215929186423, "rouge2_precision": 0.03426167301990358, "rouge2_precision_stderr": 0.0012315349939346193, "rouge2_recall": 0.1392743239236764, "rouge2_recall_stderr": 0.0032402937101130005, "rougeL_fmeasure": 0.10030410348988913, "rougeL_fmeasure_stderr": 0.001982177743894177, "rougeL_precision": 0.06788583144299273, "rougeL_precision_stderr": 0.0017322495246173835, "rougeL_recall": 0.2789368995485402, "rougeL_recall_stderr": 0.004534363609043255, "rougeLsum_fmeasure": 0.10000096230678256, "rougeLsum_fmeasure_stderr": 0.0020180656843696763, "rougeLsum_precision": 0.06804073106746164, "rougeLsum_precision_stderr": 0.0017862439598119247, "rougeLsum_recall": 0.2748870394126657, "rougeLsum_recall_stderr": 0.004363263583019278}}, "1": {"PALM_prompt": {"bleu": 0.4045455604224073, "bleu_stderr": 0.0236576374456469, "rouge1_fmeasure": 0.10223984226049061, "rouge1_fmeasure_stderr": 0.00175780338655891, "rouge1_precision": 0.0658970899010487, "rouge1_precision_stderr": 0.0014479646288584037, "rouge1_recall": 0.3525261563529861, "rouge1_recall_stderr": 0.0050415399648793355, "rouge2_fmeasure": 0.04600863612485982, "rouge2_fmeasure_stderr": 0.0011042614632539437, "rouge2_precision": 0.029637673551245882, "rouge2_precision_stderr": 0.0009108165706734375, "rouge2_recall": 0.1656326153435222, "rouge2_recall_stderr": 0.0035022509689606276, "rougeL_fmeasure": 0.09408291635077375, "rougeL_fmeasure_stderr": 0.0015927729242144477, "rougeL_precision": 0.06067096918490614, "rougeL_precision_stderr": 0.0013097575690947149, "rougeL_recall": 0.32060026791609386, "rougeL_recall_stderr": 0.00440422446137861, "rougeLsum_fmeasure": 0.09636959670083528, "rougeLsum_fmeasure_stderr": 0.001661162141611167, "rougeLsum_precision": 0.06224519569533051, "rougeLsum_precision_stderr": 0.0013718123071500563, "rougeLsum_recall": 0.33007977466199706, "rougeLsum_recall_stderr": 0.00463723121449382}}, "2": {"PALM_prompt": {"bleu": 0.4841613222907723, "bleu_stderr": 0.015039273978834939, "rouge1_fmeasure": 0.10929288546298149, "rouge1_fmeasure_stderr": 0.0017988667388595812, "rouge1_precision": 0.06966385259464293, "rouge1_precision_stderr": 0.0013937412637180038, "rouge1_recall": 0.37512398125219343, "rouge1_recall_stderr": 0.005116912749333124, "rouge2_fmeasure": 0.050112452100538586, "rouge2_fmeasure_stderr": 0.0011570842093378976, "rouge2_precision": 0.03198301338818694, "rouge2_precision_stderr": 0.0008718774993262271, "rouge2_recall": 0.18094325736423483, "rouge2_recall_stderr": 0.0036323707654308335, "rougeL_fmeasure": 0.09977161025587211, "rougeL_fmeasure_stderr": 0.0016243784066598424, "rougeL_precision": 0.06360059097903424, "rougeL_precision_stderr": 0.0012449705718618718, "rougeL_recall": 0.3388899116424299, "rougeL_recall_stderr": 0.004438023718580559, "rougeLsum_fmeasure": 0.10273089804493778, "rougeLsum_fmeasure_stderr": 0.0016928851028229573, "rougeLsum_precision": 0.0655984906937379, "rougeLsum_precision_stderr": 0.0013223896668450679, "rougeLsum_recall": 0.35115785035117936, "rougeLsum_recall_stderr": 0.004705333926430955}}, "3": {"PALM_prompt": {"bleu": 0.5848578510766751, "bleu_stderr": 0.02382820842952149, "rouge1_fmeasure": 0.1123642181797315, "rouge1_fmeasure_stderr": 0.0018086780742506458, "rouge1_precision": 0.07146406939302619, "rouge1_precision_stderr": 0.0014453804488559735, "rouge1_recall": 0.3923331320425209, "rouge1_recall_stderr": 0.005255569174563494, "rouge2_fmeasure": 0.05189108829034796, "rouge2_fmeasure_stderr": 0.0011675575856479941, "rouge2_precision": 0.03311041175360562, "rouge2_precision_stderr": 0.000955769810908034, "rouge2_recall": 0.19200440577658992, "rouge2_recall_stderr": 0.0038021308525194295, "rougeL_fmeasure": 0.10153877113079328, "rougeL_fmeasure_stderr": 0.0016163226649112037, "rougeL_precision": 0.06458792165995919, "rougeL_precision_stderr": 0.0012821596441060375, "rougeL_recall": 0.35290395771176203, "rougeL_recall_stderr": 0.004621707552330829, "rougeLsum_fmeasure": 0.1052784059414783, "rougeLsum_fmeasure_stderr": 0.0017096425628278053, "rougeLsum_precision": 0.06707064624330737, "rougeLsum_precision_stderr": 0.0013662159713619777, "rougeLsum_recall": 0.3662637426139491, "rougeLsum_recall_stderr": 0.004856741037403349}}, "4": {"PALM_prompt": {"bleu": 0.5815622592156788, "bleu_stderr": 0.029409084100340988, "rouge1_fmeasure": 0.11600454183618039, "rouge1_fmeasure_stderr": 0.0017414056230866818, "rouge1_precision": 0.073350621026601, "rouge1_precision_stderr": 0.0013008441046774397, "rouge1_recall": 0.402711193766134, "rouge1_recall_stderr": 0.005268855314940937, "rouge2_fmeasure": 0.05350261302900716, "rouge2_fmeasure_stderr": 0.0011180842631744589, "rouge2_precision": 0.03375946119188094, "rouge2_precision_stderr": 0.0008125358382760585, "rouge2_recall": 0.19912887839246102, "rouge2_recall_stderr": 0.003887307664703985, "rougeL_fmeasure": 0.10528355390377818, "rougeL_fmeasure_stderr": 0.0015840788654041859, "rougeL_precision": 0.06666295825312767, "rougeL_precision_stderr": 0.001186073659230382, "rougeL_recall": 0.3633610895084421, "rougeL_recall_stderr": 0.004665095807994941, "rougeLsum_fmeasure": 0.10893873510925292, "rougeLsum_fmeasure_stderr": 0.0016436803370992086, "rougeLsum_precision": 0.06900491931707611, "rougeLsum_precision_stderr": 0.0012357509964065728, "rougeLsum_recall": 0.37672100976400624, "rougeLsum_recall_stderr": 0.0048637174582481756}}, "5": {"PALM_prompt": {"bleu": 0.6292734470145089, "bleu_stderr": 0.032038534440523625, "rouge1_fmeasure": 0.11745960029316531, "rouge1_fmeasure_stderr": 0.0017300682232481712, "rouge1_precision": 0.07430554120104693, "rouge1_precision_stderr": 0.0013333669684835047, "rouge1_recall": 0.40910724158477596, "rouge1_recall_stderr": 0.005285245988912935, "rouge2_fmeasure": 0.05452068929305587, "rouge2_fmeasure_stderr": 0.0011284229311503077, "rouge2_precision": 0.03448188474999599, "rouge2_precision_stderr": 0.0008618085647059942, "rouge2_recall": 0.20431478176242832, "rouge2_recall_stderr": 0.0039032533628420053, "rougeL_fmeasure": 0.10569984600090632, "rougeL_fmeasure_stderr": 0.0015559332991619912, "rougeL_precision": 0.06699056196994188, "rougeL_precision_stderr": 0.001214766584623908, "rougeL_recall": 0.36652587603372083, "rougeL_recall_stderr": 0.0046510504742824435, "rougeLsum_fmeasure": 0.10969123482143882, "rougeLsum_fmeasure_stderr": 0.0016247884404989854, "rougeLsum_precision": 0.06952080008680515, "rougeLsum_precision_stderr": 0.0012664771484443501, "rougeLsum_recall": 0.38090153422695555, "rougeLsum_recall_stderr": 0.004832634454846149}}}, "GEM/wiki_lingua_en": {"0": {"tldr_en": {"bleu": 1.4638786550080012, "bleu_stderr": 0.08267943817716743, "rouge1_fmeasure": 0.1735899714732908, "rouge1_fmeasure_stderr": 0.0018379295907133386, "rouge1_precision": 0.1501551653167452, "rouge1_precision_stderr": 0.0019145985531852103, "rouge1_recall": 0.2489709412710993, "rouge1_recall_stderr": 0.002565698467707567, "rouge2_fmeasure": 0.03527159968688606, "rouge2_fmeasure_stderr": 0.000856000364522866, "rouge2_precision": 0.030202594861558258, "rouge2_precision_stderr": 0.000759198757195269, "rouge2_recall": 0.05179351194647759, "rouge2_recall_stderr": 0.0013706134138774457, "rougeL_fmeasure": 0.13542458385119363, "rougeL_fmeasure_stderr": 0.0013094512830872681, "rougeL_precision": 0.11587674124907248, "rougeL_precision_stderr": 0.0013578078418251586, "rougeL_recall": 0.19905321222991249, "rougeL_recall_stderr": 0.002072708736632529, "rougeLsum_fmeasure": 0.15998195547427285, "rougeLsum_fmeasure_stderr": 0.0016735883778822192, "rougeLsum_precision": 0.13806383555422214, "rougeLsum_precision_stderr": 0.0017411900348176868, "rougeLsum_recall": 0.23066945559291627, "rougeLsum_recall_stderr": 0.0023890574843587445}}, "1": {"tldr_en": {"bleu": 2.251037388830426, "bleu_stderr": 0.06386416803226096, "rouge1_fmeasure": 0.20517386588028216, "rouge1_fmeasure_stderr": 0.0019096420138433956, "rouge1_precision": 0.17561493820630653, "rouge1_precision_stderr": 0.002048580212979638, "rouge1_recall": 0.2975242805713054, "rouge1_recall_stderr": 0.002661646132459767, "rouge2_fmeasure": 0.04509174855817, "rouge2_fmeasure_stderr": 0.0009362703351931108, "rouge2_precision": 0.038705255482649484, "rouge2_precision_stderr": 0.0008641576645556467, "rouge2_recall": 0.06721747132871511, "rouge2_recall_stderr": 0.0015546205463413934, "rougeL_fmeasure": 0.1461985663690308, "rougeL_fmeasure_stderr": 0.0012629826687957297, "rougeL_precision": 0.12348273344528769, "rougeL_precision_stderr": 0.0013241963423884194, "rougeL_recall": 0.2182708873208918, "rougeL_recall_stderr": 0.002078335701646665, "rougeLsum_fmeasure": 0.19199261777381824, "rougeLsum_fmeasure_stderr": 0.0017768312743395834, "rougeLsum_precision": 0.16411787830700947, "rougeLsum_precision_stderr": 0.001905726984632049, "rougeLsum_recall": 0.2793462022470309, "rougeLsum_recall_stderr": 0.00252183230288639}}, "2": {"tldr_en": {"bleu": 2.638972923238051, "bleu_stderr": 0.04079081483713292, "rouge1_fmeasure": 0.2149553929096824, "rouge1_fmeasure_stderr": 0.0018159340053845016, "rouge1_precision": 0.18279672864000174, "rouge1_precision_stderr": 0.001990030228234584, "rouge1_recall": 0.31492793105361294, "rouge1_recall_stderr": 0.0025616011512098248, "rouge2_fmeasure": 0.050099922234849326, "rouge2_fmeasure_stderr": 0.0009396332686045797, "rouge2_precision": 0.042646009741889805, "rouge2_precision_stderr": 0.0008649264691986515, "rouge2_recall": 0.07496946538732863, "rouge2_recall_stderr": 0.0015594180926328848, "rougeL_fmeasure": 0.152189270942713, "rougeL_fmeasure_stderr": 0.0012132534448735604, "rougeL_precision": 0.12807089612938685, "rougeL_precision_stderr": 0.0013124423288503014, "rougeL_recall": 0.22896480825128132, "rougeL_recall_stderr": 0.0020362817656302, "rougeLsum_fmeasure": 0.20261963860140034, "rougeLsum_fmeasure_stderr": 0.001699260136326749, "rougeLsum_precision": 0.1719794802172194, "rougeLsum_precision_stderr": 0.0018519473657900671, "rougeLsum_recall": 0.29789003880343934, "rougeLsum_recall_stderr": 0.002450408388704567}}, "3": {"tldr_en": {"bleu": 2.7817782152958124, "bleu_stderr": 0.04494580041852014, "rouge1_fmeasure": 0.1811722525980339, "rouge1_fmeasure_stderr": 0.0022088859505497234, "rouge1_precision": 0.15880336071647017, "rouge1_precision_stderr": 0.0022944434654695485, "rouge1_recall": 0.26506418569211093, "rouge1_recall_stderr": 0.0032637292322135534, "rouge2_fmeasure": 0.04316445582714641, "rouge2_fmeasure_stderr": 0.000956046878850861, "rouge2_precision": 0.0374298998336526, "rouge2_precision_stderr": 0.0009347509198517388, "rouge2_recall": 0.06524543251395427, "rouge2_recall_stderr": 0.001603994023546246, "rougeL_fmeasure": 0.12842259890093402, "rougeL_fmeasure_stderr": 0.0015101623900602265, "rougeL_precision": 0.11189815593178445, "rougeL_precision_stderr": 0.001600964481991733, "rougeL_recall": 0.1930856830862472, "rougeL_recall_stderr": 0.0025117226250944077, "rougeLsum_fmeasure": 0.1708671620256238, "rougeLsum_fmeasure_stderr": 0.0020803868308500607, "rougeLsum_precision": 0.14949474498482374, "rougeLsum_precision_stderr": 0.0021540706302144844, "rougeLsum_recall": 0.2508189749530171, "rougeLsum_recall_stderr": 0.0031145852012745777}}, "4": {"tldr_en": {"bleu": 0.5997291080192819, "bleu_stderr": 0.034966523246928005, "rouge1_fmeasure": 0.058148219500646206, "rouge1_fmeasure_stderr": 0.0019439260562197995, "rouge1_precision": 0.0526082191649819, "rouge1_precision_stderr": 0.0019579711254660813, "rouge1_recall": 0.08887123055545011, "rouge1_recall_stderr": 0.002973119831747629, "rouge2_fmeasure": 0.013391403283503953, "rouge2_fmeasure_stderr": 0.0006305028420949355, "rouge2_precision": 0.012404560376357416, "rouge2_precision_stderr": 0.000765615351847643, "rouge2_recall": 0.021336430842142755, "rouge2_recall_stderr": 0.001118116808651589, "rougeL_fmeasure": 0.042154106197481285, "rougeL_fmeasure_stderr": 0.001383034127114084, "rougeL_precision": 0.038334561197559465, "rougeL_precision_stderr": 0.001465640058040743, "rougeL_recall": 0.06619947973463458, "rougeL_recall_stderr": 0.0022604433031636296, "rougeLsum_fmeasure": 0.05448171126882292, "rougeLsum_fmeasure_stderr": 0.0018181715140947877, "rougeLsum_precision": 0.049466020968478554, "rougeLsum_precision_stderr": 0.0018544231085558262, "rougeLsum_recall": 0.08334408075199987, "rougeLsum_recall_stderr": 0.002792361572274234}}, "5": {"tldr_en": {"bleu": 1.0320053783861012e-06, "bleu_stderr": 1.6548309745966328e-06, "rouge1_fmeasure": 0.009101109725055801, "rouge1_fmeasure_stderr": 0.000849061484627802, "rouge1_precision": 0.00828795189621696, "rouge1_precision_stderr": 0.0008084030145764894, "rouge1_recall": 0.013904833680136126, "rouge1_recall_stderr": 0.0013152248622154829, "rouge2_fmeasure": 0.0021173402290246453, "rouge2_fmeasure_stderr": 0.0002651969883574264, "rouge2_precision": 0.0017579778442265573, "rouge2_precision_stderr": 0.00022272256203822104, "rouge2_recall": 0.0034824583016457547, "rouge2_recall_stderr": 0.0004707745855497479, "rougeL_fmeasure": 0.006671364196388791, "rougeL_fmeasure_stderr": 0.0006155682683130244, "rougeL_precision": 0.00606164612301448, "rougeL_precision_stderr": 0.0005820824170547412, "rougeL_recall": 0.010516775330575035, "rougeL_recall_stderr": 0.0010286453150278683, "rougeLsum_fmeasure": 0.00852403124177262, "rougeLsum_fmeasure_stderr": 0.000789483822967171, "rougeLsum_precision": 0.0077547689033896795, "rougeLsum_precision_stderr": 0.0007519757597042171, "rougeLsum_recall": 0.013113865139552568, "rougeLsum_recall_stderr": 0.0012437323588959986}}}, "e2e_nlg_cleaned": {"0": {"generate_text_restaurant": {"bleu": 1.4456822172834254, "bleu_stderr": 0.04276533070237041, "rouge1_fmeasure": 0.10550747830492155, "rouge1_fmeasure_stderr": 0.001600046418184004, "rouge1_precision": 0.08084608817477075, "rouge1_precision_stderr": 0.0013037630358869862, "rouge1_recall": 0.16055476672730024, "rouge1_recall_stderr": 0.0022564902307428436, "rouge2_fmeasure": 0.023111704860364103, "rouge2_fmeasure_stderr": 0.0008023451007582199, "rouge2_precision": 0.0180883910143694, "rouge2_precision_stderr": 0.0006324971623061661, "rouge2_recall": 0.03352985411112681, "rouge2_recall_stderr": 0.0011860257734223087, "rougeL_fmeasure": 0.10309579699961463, "rougeL_fmeasure_stderr": 0.0014856345287328617, "rougeL_precision": 0.07897160421844947, "rougeL_precision_stderr": 0.0012157586325601468, "rougeL_recall": 0.15704150708399545, "rougeL_recall_stderr": 0.0020880518954252106, "rougeLsum_fmeasure": 0.085687119444743, "rougeLsum_fmeasure_stderr": 0.0014326281774339593, "rougeLsum_precision": 0.06566532991903784, "rougeLsum_precision_stderr": 0.00115593325264158, "rougeLsum_recall": 0.13043930012149813, "rougeLsum_recall_stderr": 0.0020438483091751833}}, "1": {"generate_text_restaurant": {"bleu": 7.854550343569453, "bleu_stderr": 0.11842361375802873, "rouge1_fmeasure": 0.37960517377654424, "rouge1_fmeasure_stderr": 0.0021312179107678742, "rouge1_precision": 0.35242925608961834, "rouge1_precision_stderr": 0.0025862879156174677, "rouge1_recall": 0.4593871286009479, "rouge1_recall_stderr": 0.0027718307444898073, "rouge2_fmeasure": 0.16225548525605324, "rouge2_fmeasure_stderr": 0.001628980531143478, "rouge2_precision": 0.15016846460595357, "rouge2_precision_stderr": 0.0016925643088238768, "rouge2_recall": 0.1987661075234813, "rouge2_recall_stderr": 0.002085741403395336, "rougeL_fmeasure": 0.2751099734003478, "rougeL_fmeasure_stderr": 0.0015986731793980245, "rougeL_precision": 0.2535878033618753, "rougeL_precision_stderr": 0.0018603284522068176, "rougeL_recall": 0.3373488751020238, "rougeL_recall_stderr": 0.0023042860742874356, "rougeLsum_fmeasure": 0.31764028681903844, "rougeLsum_fmeasure_stderr": 0.0020166639615139246, "rougeLsum_precision": 0.2947167761956799, "rougeLsum_precision_stderr": 0.002321783937504011, "rougeLsum_recall": 0.3850310566251188, "rougeLsum_recall_stderr": 0.0026364808102144186}}, "2": {"generate_text_restaurant": {"bleu": 10.584259500465588, "bleu_stderr": 0.1544206935916045, "rouge1_fmeasure": 0.41716631446436636, "rouge1_fmeasure_stderr": 0.001904443983975073, "rouge1_precision": 0.4101598697462684, "rouge1_precision_stderr": 0.002246311055501821, "rouge1_recall": 0.4603951235406536, "rouge1_recall_stderr": 0.002736343584240638, "rouge2_fmeasure": 0.18592733733343356, "rouge2_fmeasure_stderr": 0.001651511887316203, "rouge2_precision": 0.1817762545465421, "rouge2_precision_stderr": 0.0017054003975476711, "rouge2_recall": 0.20814546072005263, "rouge2_recall_stderr": 0.0021073018090344247, "rougeL_fmeasure": 0.29825905325627894, "rougeL_fmeasure_stderr": 0.0016671912167031061, "rougeL_precision": 0.29271400984628115, "rougeL_precision_stderr": 0.0018520206075962242, "rougeL_recall": 0.3307167069836982, "rougeL_recall_stderr": 0.002352222065176941, "rougeLsum_fmeasure": 0.3497622641102556, "rougeLsum_fmeasure_stderr": 0.0019222555310956092, "rougeLsum_precision": 0.3438330605735075, "rougeLsum_precision_stderr": 0.0021559258341024025, "rougeLsum_recall": 0.3863382687718853, "rougeLsum_recall_stderr": 0.0026264477519150294}}, "3": {"generate_text_restaurant": {"bleu": 11.005027804713954, "bleu_stderr": 0.14913713325107694, "rouge1_fmeasure": 0.4199469764935773, "rouge1_fmeasure_stderr": 0.001866102905923008, "rouge1_precision": 0.4128283610854264, "rouge1_precision_stderr": 0.00218582649540743, "rouge1_recall": 0.4617654209580726, "rouge1_recall_stderr": 0.0027204559282358, "rouge2_fmeasure": 0.18965165207657023, "rouge2_fmeasure_stderr": 0.0016611244058807987, "rouge2_precision": 0.18554586275444523, "rouge2_precision_stderr": 0.0017040263392683272, "rouge2_recall": 0.2117021500635163, "rouge2_recall_stderr": 0.002152756842715476, "rougeL_fmeasure": 0.298413421066599, "rougeL_fmeasure_stderr": 0.0016514441907895666, "rougeL_precision": 0.29313420912472204, "rougeL_precision_stderr": 0.0018337994526123047, "rougeL_recall": 0.32931921594254, "rougeL_recall_stderr": 0.0023370831957328685, "rougeLsum_fmeasure": 0.3531127839068146, "rougeLsum_fmeasure_stderr": 0.0018773997153010787, "rougeLsum_precision": 0.34697556096050464, "rougeLsum_precision_stderr": 0.002097945215373547, "rougeLsum_recall": 0.3888925774714783, "rougeLsum_recall_stderr": 0.002615178055125266}}, "4": {"generate_text_restaurant": {"bleu": 11.363725115618854, "bleu_stderr": 0.1349892134607558, "rouge1_fmeasure": 0.4214008037563902, "rouge1_fmeasure_stderr": 0.0018957274669436463, "rouge1_precision": 0.41369428294464894, "rouge1_precision_stderr": 0.0022630498681273214, "rouge1_recall": 0.463073205676912, "rouge1_recall_stderr": 0.002620101280268744, "rouge2_fmeasure": 0.19224882966800977, "rouge2_fmeasure_stderr": 0.001688941669379114, "rouge2_precision": 0.18853767720104403, "rouge2_precision_stderr": 0.0017966301373649335, "rouge2_recall": 0.21376292605494995, "rouge2_recall_stderr": 0.0021133996361269876, "rougeL_fmeasure": 0.30045503720645306, "rougeL_fmeasure_stderr": 0.0017243402211031724, "rougeL_precision": 0.2947773213194346, "rougeL_precision_stderr": 0.0019453260402410404, "rougeL_recall": 0.33160719324501514, "rougeL_recall_stderr": 0.0023386028746102032, "rougeLsum_fmeasure": 0.35440044254437, "rougeLsum_fmeasure_stderr": 0.001939185206150459, "rougeLsum_precision": 0.34793871661300624, "rougeLsum_precision_stderr": 0.0022022816802554548, "rougeLsum_recall": 0.38987225844490936, "rougeLsum_recall_stderr": 0.0025624343675698957}}, "5": {"generate_text_restaurant": {"bleu": 11.396192996497414, "bleu_stderr": 0.16654357094855035, "rouge1_fmeasure": 0.42256346127489886, "rouge1_fmeasure_stderr": 0.0018711992463432423, "rouge1_precision": 0.415343404582103, "rouge1_precision_stderr": 0.0022395714603746343, "rouge1_recall": 0.462339881403203, "rouge1_recall_stderr": 0.002606515070610007, "rouge2_fmeasure": 0.19258472578075223, "rouge2_fmeasure_stderr": 0.0016595774845375585, "rouge2_precision": 0.18874947831873545, "rouge2_precision_stderr": 0.0017363983679664929, "rouge2_recall": 0.21329100699058842, "rouge2_recall_stderr": 0.0020862831128997342, "rougeL_fmeasure": 0.29935707532452077, "rougeL_fmeasure_stderr": 0.0016828692465751755, "rougeL_precision": 0.29366555957532514, "rougeL_precision_stderr": 0.0018624351126946828, "rougeL_recall": 0.32911404216108797, "rougeL_recall_stderr": 0.0023155754665530786, "rougeLsum_fmeasure": 0.3555436949251867, "rougeLsum_fmeasure_stderr": 0.0019127831146169912, "rougeLsum_precision": 0.34963846222070455, "rougeLsum_precision_stderr": 0.0021787598409919178, "rougeLsum_recall": 0.3890874281204962, "rougeLsum_recall_stderr": 0.0025265070175629857}}}, "gem_xsum": {"0": {"article_DOC_summary": {"bleu": 1.8234981410881652, "bleu_stderr": 0.09861688194525574, "rouge1_fmeasure": 0.20889878659689404, "rouge1_fmeasure_stderr": 0.002458161766680771, "rouge1_precision": 0.15422621570346934, "rouge1_precision_stderr": 0.0020039005936603317, "rouge1_recall": 0.3506635490563916, "rouge1_recall_stderr": 0.0042556493547655115, "rouge2_fmeasure": 0.04565942952067972, "rouge2_fmeasure_stderr": 0.001484562672483921, "rouge2_precision": 0.03307990095257621, "rouge2_precision_stderr": 0.0011002276404168225, "rouge2_recall": 0.07910944220650014, "rouge2_recall_stderr": 0.0026293603468150466, "rougeL_fmeasure": 0.15587034501708355, "rougeL_fmeasure_stderr": 0.0018431637093872144, "rougeL_precision": 0.11490133308951496, "rougeL_precision_stderr": 0.001481297426684668, "rougeL_recall": 0.26284399370938016, "rougeL_recall_stderr": 0.0033084414512192374, "rougeLsum_fmeasure": 0.1651849748571103, "rougeLsum_fmeasure_stderr": 0.002039061494531475, "rougeLsum_precision": 0.12158807333409381, "rougeLsum_precision_stderr": 0.0016089880194761488, "rougeLsum_recall": 0.278789316707468, "rougeLsum_recall_stderr": 0.00364738944247525}}, "1": {"article_DOC_summary": {"bleu": 1.4511145888771138, "bleu_stderr": 0.09215852910549645, "rouge1_fmeasure": 0.18254418171842912, "rouge1_fmeasure_stderr": 0.0024443411491113813, "rouge1_precision": 0.12978400090119854, "rouge1_precision_stderr": 0.0018214048412026733, "rouge1_recall": 0.32027413224988105, "rouge1_recall_stderr": 0.00416743115408514, "rouge2_fmeasure": 0.036825241144522146, "rouge2_fmeasure_stderr": 0.0014067669670603119, "rouge2_precision": 0.025920284045820686, "rouge2_precision_stderr": 0.0009915583067368265, "rouge2_recall": 0.06631766447507839, "rouge2_recall_stderr": 0.0026016286386155744, "rougeL_fmeasure": 0.1379121041144307, "rougeL_fmeasure_stderr": 0.0018159806506780998, "rougeL_precision": 0.09779168145477703, "rougeL_precision_stderr": 0.0013336831707437397, "rougeL_recall": 0.24393449987832236, "rougeL_recall_stderr": 0.0032690620169295624, "rougeLsum_fmeasure": 0.14685271867556554, "rougeLsum_fmeasure_stderr": 0.00202786402481471, "rougeLsum_precision": 0.10419708360998835, "rougeLsum_precision_stderr": 0.0014908021891115058, "rougeLsum_recall": 0.2591470200293115, "rougeLsum_recall_stderr": 0.0035902088886349626}}, "2": {"article_DOC_summary": {"bleu": 1.4173910716715976, "bleu_stderr": 0.1269050055569669, "rouge1_fmeasure": 0.1784133650153775, "rouge1_fmeasure_stderr": 0.002434527345664647, "rouge1_precision": 0.12682893488466288, "rouge1_precision_stderr": 0.0018115124386976255, "rouge1_recall": 0.3129238773710033, "rouge1_recall_stderr": 0.004144317584991236, "rouge2_fmeasure": 0.03377646994942601, "rouge2_fmeasure_stderr": 0.0013577113683580135, "rouge2_precision": 0.023792739813654398, "rouge2_precision_stderr": 0.0009538695469598671, "rouge2_recall": 0.060628286518002124, "rouge2_recall_stderr": 0.002544171640335871, "rougeL_fmeasure": 0.13445676544883162, "rougeL_fmeasure_stderr": 0.001742983161792639, "rougeL_precision": 0.09538132852222156, "rougeL_precision_stderr": 0.0012844315555328582, "rougeL_recall": 0.23736904076265325, "rougeL_recall_stderr": 0.0031180197306729797, "rougeLsum_fmeasure": 0.14302327166537732, "rougeLsum_fmeasure_stderr": 0.0020121565752601223, "rougeLsum_precision": 0.10150079343006048, "rougeLsum_precision_stderr": 0.0014805542361053387, "rougeLsum_recall": 0.25224041568358746, "rougeLsum_recall_stderr": 0.00356325287772434}}, "3": {"article_DOC_summary": {"bleu": 1.4410854543220795, "bleu_stderr": 0.11065939978206533, "rouge1_fmeasure": 0.17405000505151677, "rouge1_fmeasure_stderr": 0.0026158795444079694, "rouge1_precision": 0.12682835665999379, "rouge1_precision_stderr": 0.00213008962319155, "rouge1_recall": 0.3009777871605996, "rouge1_recall_stderr": 0.0045155564803296844, "rouge2_fmeasure": 0.03375564198727498, "rouge2_fmeasure_stderr": 0.0014032677780195426, "rouge2_precision": 0.02441534481786468, "rouge2_precision_stderr": 0.0010675183688113013, "rouge2_recall": 0.060023335309239284, "rouge2_recall_stderr": 0.0025544641047680868, "rougeL_fmeasure": 0.13287002402660542, "rougeL_fmeasure_stderr": 0.0019574198182001363, "rougeL_precision": 0.09672846502785581, "rougeL_precision_stderr": 0.001605939754348312, "rougeL_recall": 0.23129794905638065, "rougeL_recall_stderr": 0.003504325859643222, "rougeLsum_fmeasure": 0.14072796227018858, "rougeLsum_fmeasure_stderr": 0.002188698179032325, "rougeLsum_precision": 0.10242219504173285, "rougeLsum_precision_stderr": 0.0017649678079630277, "rougeLsum_recall": 0.2447872835150151, "rougeLsum_recall_stderr": 0.0038950725453768833}}, "4": {"article_DOC_summary": {"bleu": 0.6753547790268645, "bleu_stderr": 0.09678811316166971, "rouge1_fmeasure": 0.046992144100321806, "rouge1_fmeasure_stderr": 0.002618786666967082, "rouge1_precision": 0.041064589753945765, "rouge1_precision_stderr": 0.002574722440175742, "rouge1_recall": 0.07375404829054749, "rouge1_recall_stderr": 0.004261542973214119, "rouge2_fmeasure": 0.008636963128827568, "rouge2_fmeasure_stderr": 0.0008391846215142884, "rouge2_precision": 0.0072827259137400735, "rouge2_precision_stderr": 0.0008839873299209189, "rouge2_recall": 0.01434569739075993, "rouge2_recall_stderr": 0.0014362041655696376, "rougeL_fmeasure": 0.03548036137516894, "rougeL_fmeasure_stderr": 0.001955807555849124, "rougeL_precision": 0.03137075485796663, "rougeL_precision_stderr": 0.0020006363883442293, "rougeL_recall": 0.05624031413634613, "rougeL_recall_stderr": 0.0032626943561910897, "rougeLsum_fmeasure": 0.03810619457684465, "rougeLsum_fmeasure_stderr": 0.0021359009016179383, "rougeLsum_precision": 0.03357423627999912, "rougeLsum_precision_stderr": 0.0021310282339018806, "rougeLsum_recall": 0.059996937228044826, "rougeLsum_recall_stderr": 0.003508594344969223}}, "5": {"article_DOC_summary": {"bleu": 3.8720991740133824e-38, "bleu_stderr": 6.757775100349013e-33, "rouge1_fmeasure": 0.0021338767527660316, "rouge1_fmeasure_stderr": 0.000606716788713842, "rouge1_precision": 0.002394598265414318, "rouge1_precision_stderr": 0.0007029813930147865, "rouge1_recall": 0.0019954716710551207, "rouge1_recall_stderr": 0.0005584193559240988, "rouge2_fmeasure": 0.00011901404509555748, "rouge2_fmeasure_stderr": 6.872962972148577e-05, "rouge2_precision": 0.0001469327010392493, "rouge2_precision_stderr": 8.511648046715374e-05, "rouge2_recall": 0.00010241330996047977, "rouge2_recall_stderr": 5.9726635104036084e-05, "rougeL_fmeasure": 0.0015909130557671355, "rougeL_fmeasure_stderr": 0.0004446509241590643, "rougeL_precision": 0.0017715789785566055, "rougeL_precision_stderr": 0.0005103213321970242, "rougeL_recall": 0.0015030111824248839, "rougeL_recall_stderr": 0.0004165975224565321, "rougeLsum_fmeasure": 0.001799689332800904, "rougeLsum_fmeasure_stderr": 0.0005143272355042585, "rougeLsum_precision": 0.0020245246393824, "rougeLsum_precision_stderr": 0.0006015169025391406, "rougeLsum_recall": 0.0016826910638698292, "rougeLsum_recall_stderr": 0.0004718028635824783}}}} \ No newline at end of file diff --git a/4b284b6bc4seed1/evaluation/generation/slim.4b284b6bc4seed1_GEM-web_nlg_en_PALM_prompt_0.json b/4b284b6bc4seed1/evaluation/generation/slim.4b284b6bc4seed1_GEM-web_nlg_en_PALM_prompt_0.json new file mode 100644 index 0000000000000000000000000000000000000000..5e3970149ebee20f6566870705359a62a6746a06 --- /dev/null +++ b/4b284b6bc4seed1/evaluation/generation/slim.4b284b6bc4seed1_GEM-web_nlg_en_PALM_prompt_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.34350884519310554, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.038772150149038065 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.07173003966213615, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.001891427473975356 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.28960101855358183, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.004686243089174828 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.10544276754647447, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0021544893348497355 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.03426167301990358, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0012315349939346193 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.1392743239236764, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0032402937101130005 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.05038765662771961, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0013708215929186423 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.06788583144299273, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0017322495246173835 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.2789368995485402, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004534363609043255 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.10030410348988913, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.001982177743894177 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.06804073106746164, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0017862439598119247 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.2748870394126657, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004363263583019278 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.10000096230678256, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0020180656843696763 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b6bc4seed1/evaluation/generation/slim.4b284b6bc4seed1_GEM-web_nlg_en_PALM_prompt_1.json b/4b284b6bc4seed1/evaluation/generation/slim.4b284b6bc4seed1_GEM-web_nlg_en_PALM_prompt_1.json new file mode 100644 index 0000000000000000000000000000000000000000..39b1a8dc6f20e4d635ac8dfc4abcf5932e52a829 --- /dev/null +++ b/4b284b6bc4seed1/evaluation/generation/slim.4b284b6bc4seed1_GEM-web_nlg_en_PALM_prompt_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.4045455604224073, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.0236576374456469 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.0658970899010487, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0014479646288584037 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.3525261563529861, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0050415399648793355 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.10223984226049061, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.00175780338655891 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.029637673551245882, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0009108165706734375 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.1656326153435222, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0035022509689606276 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.04600863612485982, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0011042614632539437 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.06067096918490614, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0013097575690947149 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.32060026791609386, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.00440422446137861 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.09408291635077375, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0015927729242144477 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.06224519569533051, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0013718123071500563 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.33007977466199706, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.00463723121449382 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.09636959670083528, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.001661162141611167 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b6bc4seed1/evaluation/generation/slim.4b284b6bc4seed1_GEM-web_nlg_en_PALM_prompt_2.json b/4b284b6bc4seed1/evaluation/generation/slim.4b284b6bc4seed1_GEM-web_nlg_en_PALM_prompt_2.json new file mode 100644 index 0000000000000000000000000000000000000000..2d02be73726c0c09b9951ab73cadf6818792a08b --- /dev/null +++ b/4b284b6bc4seed1/evaluation/generation/slim.4b284b6bc4seed1_GEM-web_nlg_en_PALM_prompt_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.4841613222907723, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.015039273978834939 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.06966385259464293, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0013937412637180038 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.37512398125219343, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.005116912749333124 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.10929288546298149, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0017988667388595812 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.03198301338818694, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0008718774993262271 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.18094325736423483, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0036323707654308335 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.050112452100538586, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0011570842093378976 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.06360059097903424, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0012449705718618718 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.3388899116424299, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004438023718580559 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.09977161025587211, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0016243784066598424 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.0655984906937379, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0013223896668450679 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.35115785035117936, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004705333926430955 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.10273089804493778, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0016928851028229573 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b6bc4seed1/evaluation/generation/slim.4b284b6bc4seed1_GEM-web_nlg_en_PALM_prompt_3.json b/4b284b6bc4seed1/evaluation/generation/slim.4b284b6bc4seed1_GEM-web_nlg_en_PALM_prompt_3.json new file mode 100644 index 0000000000000000000000000000000000000000..01ba09695142ffe839cd5932be61a662bd6ec000 --- /dev/null +++ b/4b284b6bc4seed1/evaluation/generation/slim.4b284b6bc4seed1_GEM-web_nlg_en_PALM_prompt_3.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.5848578510766751, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.02382820842952149 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.07146406939302619, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0014453804488559735 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.3923331320425209, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.005255569174563494 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.1123642181797315, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0018086780742506458 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.03311041175360562, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.000955769810908034 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.19200440577658992, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0038021308525194295 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.05189108829034796, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0011675575856479941 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.06458792165995919, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0012821596441060375 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.35290395771176203, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004621707552330829 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.10153877113079328, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0016163226649112037 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.06707064624330737, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0013662159713619777 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.3662637426139491, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004856741037403349 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.1052784059414783, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0017096425628278053 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 3, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b6bc4seed1/evaluation/generation/slim.4b284b6bc4seed1_GEM-web_nlg_en_PALM_prompt_4.json b/4b284b6bc4seed1/evaluation/generation/slim.4b284b6bc4seed1_GEM-web_nlg_en_PALM_prompt_4.json new file mode 100644 index 0000000000000000000000000000000000000000..c0d927e4ef9569b8cac351ac840f46cd9e3408fb --- /dev/null +++ b/4b284b6bc4seed1/evaluation/generation/slim.4b284b6bc4seed1_GEM-web_nlg_en_PALM_prompt_4.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.5815622592156788, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.029409084100340988 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.073350621026601, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0013008441046774397 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.402711193766134, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.005268855314940937 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.11600454183618039, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0017414056230866818 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.03375946119188094, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0008125358382760585 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.19912887839246102, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.003887307664703985 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.05350261302900716, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0011180842631744589 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.06666295825312767, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.001186073659230382 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.3633610895084421, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004665095807994941 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.10528355390377818, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0015840788654041859 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.06900491931707611, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0012357509964065728 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.37672100976400624, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0048637174582481756 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.10893873510925292, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0016436803370992086 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 4, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b6bc4seed1/evaluation/generation/slim.4b284b6bc4seed1_GEM-web_nlg_en_PALM_prompt_5.json b/4b284b6bc4seed1/evaluation/generation/slim.4b284b6bc4seed1_GEM-web_nlg_en_PALM_prompt_5.json new file mode 100644 index 0000000000000000000000000000000000000000..a12ef71a13f5f45ad051e9e55a895aaa0f4646a3 --- /dev/null +++ b/4b284b6bc4seed1/evaluation/generation/slim.4b284b6bc4seed1_GEM-web_nlg_en_PALM_prompt_5.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.6292734470145089, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.032038534440523625 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.07430554120104693, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0013333669684835047 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.40910724158477596, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.005285245988912935 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.11745960029316531, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0017300682232481712 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.03448188474999599, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0008618085647059942 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.20431478176242832, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0039032533628420053 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.05452068929305587, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0011284229311503077 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.06699056196994188, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.001214766584623908 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.36652587603372083, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0046510504742824435 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.10569984600090632, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0015559332991619912 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.06952080008680515, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0012664771484443501 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.38090153422695555, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004832634454846149 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.10969123482143882, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0016247884404989854 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 5, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b6bc4seed1/evaluation/generation/slim.4b284b6bc4seed1_GEM-wiki_lingua_en_tldr_en_0.json b/4b284b6bc4seed1/evaluation/generation/slim.4b284b6bc4seed1_GEM-wiki_lingua_en_tldr_en_0.json new file mode 100644 index 0000000000000000000000000000000000000000..d1edd5af2eca4304309b670565bb3a8304bdbf66 --- /dev/null +++ b/4b284b6bc4seed1/evaluation/generation/slim.4b284b6bc4seed1_GEM-wiki_lingua_en_tldr_en_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.1501551653167452, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0019145985531852103 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.2489709412710993, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.002565698467707567 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.1735899714732908, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0018379295907133386 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.030202594861558258, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.000759198757195269 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.05179351194647759, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0013706134138774457 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.03527159968688606, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.000856000364522866 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.11587674124907248, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0013578078418251586 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.19905321222991249, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.002072708736632529 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.13542458385119363, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0013094512830872681 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.13806383555422214, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0017411900348176868 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.23066945559291627, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0023890574843587445 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.15998195547427285, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0016735883778822192 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 1.4638786550080012, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.08267943817716743 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b6bc4seed1/evaluation/generation/slim.4b284b6bc4seed1_GEM-wiki_lingua_en_tldr_en_1.json b/4b284b6bc4seed1/evaluation/generation/slim.4b284b6bc4seed1_GEM-wiki_lingua_en_tldr_en_1.json new file mode 100644 index 0000000000000000000000000000000000000000..6aad5ae8796810591de0aa49e4d14041f4768e99 --- /dev/null +++ b/4b284b6bc4seed1/evaluation/generation/slim.4b284b6bc4seed1_GEM-wiki_lingua_en_tldr_en_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.17561493820630653, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.002048580212979638 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.2975242805713054, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.002661646132459767 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.20517386588028216, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0019096420138433956 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.038705255482649484, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0008641576645556467 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.06721747132871511, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0015546205463413934 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.04509174855817, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0009362703351931108 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.12348273344528769, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0013241963423884194 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.2182708873208918, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.002078335701646665 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.1461985663690308, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0012629826687957297 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.16411787830700947, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.001905726984632049 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.2793462022470309, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.00252183230288639 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.19199261777381824, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0017768312743395834 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 2.251037388830426, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.06386416803226096 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b6bc4seed1/evaluation/generation/slim.4b284b6bc4seed1_GEM-wiki_lingua_en_tldr_en_2.json b/4b284b6bc4seed1/evaluation/generation/slim.4b284b6bc4seed1_GEM-wiki_lingua_en_tldr_en_2.json new file mode 100644 index 0000000000000000000000000000000000000000..b28ae3c783dfa5f2cb96211c3d34201f1761ee56 --- /dev/null +++ b/4b284b6bc4seed1/evaluation/generation/slim.4b284b6bc4seed1_GEM-wiki_lingua_en_tldr_en_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.18279672864000174, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.001990030228234584 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.31492793105361294, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0025616011512098248 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.2149553929096824, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0018159340053845016 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.042646009741889805, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0008649264691986515 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.07496946538732863, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0015594180926328848 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.050099922234849326, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0009396332686045797 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.12807089612938685, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0013124423288503014 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.22896480825128132, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0020362817656302 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.152189270942713, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0012132534448735604 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.1719794802172194, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0018519473657900671 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.29789003880343934, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.002450408388704567 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.20261963860140034, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.001699260136326749 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 2.638972923238051, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.04079081483713292 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b6bc4seed1/evaluation/generation/slim.4b284b6bc4seed1_GEM-wiki_lingua_en_tldr_en_3.json b/4b284b6bc4seed1/evaluation/generation/slim.4b284b6bc4seed1_GEM-wiki_lingua_en_tldr_en_3.json new file mode 100644 index 0000000000000000000000000000000000000000..4cf26291d43e753b61e7522a16acb39e811c361d --- /dev/null +++ b/4b284b6bc4seed1/evaluation/generation/slim.4b284b6bc4seed1_GEM-wiki_lingua_en_tldr_en_3.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.15880336071647017, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0022944434654695485 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.26506418569211093, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0032637292322135534 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.1811722525980339, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0022088859505497234 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.0374298998336526, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0009347509198517388 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.06524543251395427, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.001603994023546246 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.04316445582714641, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.000956046878850861 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.11189815593178445, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.001600964481991733 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.1930856830862472, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0025117226250944077 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.12842259890093402, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0015101623900602265 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.14949474498482374, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0021540706302144844 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.2508189749530171, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0031145852012745777 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.1708671620256238, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0020803868308500607 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 2.7817782152958124, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.04494580041852014 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 3, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b6bc4seed1/evaluation/generation/slim.4b284b6bc4seed1_GEM-wiki_lingua_en_tldr_en_4.json b/4b284b6bc4seed1/evaluation/generation/slim.4b284b6bc4seed1_GEM-wiki_lingua_en_tldr_en_4.json new file mode 100644 index 0000000000000000000000000000000000000000..ec7dabd0828fcf6346aa504a8de843f5de1cf645 --- /dev/null +++ b/4b284b6bc4seed1/evaluation/generation/slim.4b284b6bc4seed1_GEM-wiki_lingua_en_tldr_en_4.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.0526082191649819, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0019579711254660813 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.08887123055545011, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.002973119831747629 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.058148219500646206, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0019439260562197995 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.012404560376357416, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.000765615351847643 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.021336430842142755, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.001118116808651589 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.013391403283503953, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0006305028420949355 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.038334561197559465, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.001465640058040743 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.06619947973463458, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0022604433031636296 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.042154106197481285, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.001383034127114084 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.049466020968478554, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0018544231085558262 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.08334408075199987, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.002792361572274234 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.05448171126882292, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0018181715140947877 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 0.5997291080192819, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.034966523246928005 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 4, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b6bc4seed1/evaluation/generation/slim.4b284b6bc4seed1_GEM-wiki_lingua_en_tldr_en_5.json b/4b284b6bc4seed1/evaluation/generation/slim.4b284b6bc4seed1_GEM-wiki_lingua_en_tldr_en_5.json new file mode 100644 index 0000000000000000000000000000000000000000..f0becfca05430fdf883dee4e0fb52e2cc8d3ed3e --- /dev/null +++ b/4b284b6bc4seed1/evaluation/generation/slim.4b284b6bc4seed1_GEM-wiki_lingua_en_tldr_en_5.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.00828795189621696, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0008084030145764894 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.013904833680136126, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0013152248622154829 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.009101109725055801, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.000849061484627802 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.0017579778442265573, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.00022272256203822104 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.0034824583016457547, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0004707745855497479 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.0021173402290246453, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0002651969883574264 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.00606164612301448, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0005820824170547412 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.010516775330575035, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0010286453150278683 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.006671364196388791, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0006155682683130244 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.0077547689033896795, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0007519757597042171 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.013113865139552568, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0012437323588959986 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.00852403124177262, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.000789483822967171 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 1.0320053783861012e-06, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 1.6548309745966328e-06 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 5, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b6bc4seed1/evaluation/generation/slim.4b284b6bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_0.json b/4b284b6bc4seed1/evaluation/generation/slim.4b284b6bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_0.json new file mode 100644 index 0000000000000000000000000000000000000000..e7c24cddbe26caa90ce88e0e8b619779c8ed6db2 --- /dev/null +++ b/4b284b6bc4seed1/evaluation/generation/slim.4b284b6bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 1.4456822172834254, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.04276533070237041 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.08084608817477075, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.0013037630358869862 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.16055476672730024, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.0022564902307428436 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.10550747830492155, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.001600046418184004 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.0180883910143694, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0006324971623061661 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.03352985411112681, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.0011860257734223087 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.023111704860364103, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0008023451007582199 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.07897160421844947, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.0012157586325601468 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.15704150708399545, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.0020880518954252106 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.10309579699961463, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0014856345287328617 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.06566532991903784, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.00115593325264158 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.13043930012149813, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.0020438483091751833 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.085687119444743, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0014326281774339593 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b6bc4seed1/evaluation/generation/slim.4b284b6bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_1.json b/4b284b6bc4seed1/evaluation/generation/slim.4b284b6bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_1.json new file mode 100644 index 0000000000000000000000000000000000000000..6f844c41d96b25bb9a50156847c483aeb9fa3a35 --- /dev/null +++ b/4b284b6bc4seed1/evaluation/generation/slim.4b284b6bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 7.854550343569453, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.11842361375802873 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.35242925608961834, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.0025862879156174677 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.4593871286009479, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.0027718307444898073 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.37960517377654424, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.0021312179107678742 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.15016846460595357, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0016925643088238768 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.1987661075234813, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.002085741403395336 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.16225548525605324, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.001628980531143478 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.2535878033618753, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.0018603284522068176 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.3373488751020238, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.0023042860742874356 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.2751099734003478, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0015986731793980245 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.2947167761956799, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.002321783937504011 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.3850310566251188, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.0026364808102144186 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.31764028681903844, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0020166639615139246 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b6bc4seed1/evaluation/generation/slim.4b284b6bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_2.json b/4b284b6bc4seed1/evaluation/generation/slim.4b284b6bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_2.json new file mode 100644 index 0000000000000000000000000000000000000000..bbe4fac19a87868da52322f4f97aa2cac7de5f8b --- /dev/null +++ b/4b284b6bc4seed1/evaluation/generation/slim.4b284b6bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 10.584259500465588, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.1544206935916045 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.4101598697462684, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.002246311055501821 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.4603951235406536, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.002736343584240638 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.41716631446436636, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.001904443983975073 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.1817762545465421, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0017054003975476711 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.20814546072005263, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.0021073018090344247 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.18592733733343356, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.001651511887316203 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.29271400984628115, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.0018520206075962242 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.3307167069836982, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.002352222065176941 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.29825905325627894, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0016671912167031061 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.3438330605735075, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.0021559258341024025 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.3863382687718853, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.0026264477519150294 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.3497622641102556, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0019222555310956092 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b6bc4seed1/evaluation/generation/slim.4b284b6bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_3.json b/4b284b6bc4seed1/evaluation/generation/slim.4b284b6bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_3.json new file mode 100644 index 0000000000000000000000000000000000000000..260d37be7fd429f5ff70becbba772707fec69235 --- /dev/null +++ b/4b284b6bc4seed1/evaluation/generation/slim.4b284b6bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_3.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 11.005027804713954, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.14913713325107694 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.4128283610854264, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.00218582649540743 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.4617654209580726, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.0027204559282358 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.4199469764935773, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.001866102905923008 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.18554586275444523, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0017040263392683272 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.2117021500635163, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.002152756842715476 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.18965165207657023, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0016611244058807987 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.29313420912472204, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.0018337994526123047 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.32931921594254, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.0023370831957328685 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.298413421066599, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0016514441907895666 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.34697556096050464, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.002097945215373547 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.3888925774714783, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.002615178055125266 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.3531127839068146, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0018773997153010787 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 3, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b6bc4seed1/evaluation/generation/slim.4b284b6bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_4.json b/4b284b6bc4seed1/evaluation/generation/slim.4b284b6bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_4.json new file mode 100644 index 0000000000000000000000000000000000000000..1d8ec503ca86c211fc44aa13e0666ac77e5bcc87 --- /dev/null +++ b/4b284b6bc4seed1/evaluation/generation/slim.4b284b6bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_4.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 11.363725115618854, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.1349892134607558 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.41369428294464894, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.0022630498681273214 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.463073205676912, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.002620101280268744 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.4214008037563902, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.0018957274669436463 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.18853767720104403, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0017966301373649335 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.21376292605494995, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.0021133996361269876 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.19224882966800977, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.001688941669379114 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.2947773213194346, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.0019453260402410404 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.33160719324501514, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.0023386028746102032 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.30045503720645306, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0017243402211031724 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.34793871661300624, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.0022022816802554548 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.38987225844490936, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.0025624343675698957 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.35440044254437, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.001939185206150459 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 4, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b6bc4seed1/evaluation/generation/slim.4b284b6bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_5.json b/4b284b6bc4seed1/evaluation/generation/slim.4b284b6bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_5.json new file mode 100644 index 0000000000000000000000000000000000000000..7623f66d2bcffbf8ef04cc71a1a71b48ab395e51 --- /dev/null +++ b/4b284b6bc4seed1/evaluation/generation/slim.4b284b6bc4seed1_e2e_nlg_cleaned_generate_text_restaurant_5.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 11.396192996497414, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.16654357094855035 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.415343404582103, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.0022395714603746343 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.462339881403203, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.002606515070610007 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.42256346127489886, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.0018711992463432423 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.18874947831873545, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0017363983679664929 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.21329100699058842, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.0020862831128997342 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.19258472578075223, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0016595774845375585 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.29366555957532514, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.0018624351126946828 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.32911404216108797, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.0023155754665530786 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.29935707532452077, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0016828692465751755 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.34963846222070455, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.0021787598409919178 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.3890874281204962, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.0025265070175629857 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.3555436949251867, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0019127831146169912 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 5, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b6bc4seed1/evaluation/generation/slim.4b284b6bc4seed1_gem_xsum_article_DOC_summary_0.json b/4b284b6bc4seed1/evaluation/generation/slim.4b284b6bc4seed1_gem_xsum_article_DOC_summary_0.json new file mode 100644 index 0000000000000000000000000000000000000000..ebc78dd2d13887e37295c0c4b09d6796daaba6cc --- /dev/null +++ b/4b284b6bc4seed1/evaluation/generation/slim.4b284b6bc4seed1_gem_xsum_article_DOC_summary_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.15422621570346934, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.0020039005936603317 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.3506635490563916, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.0042556493547655115 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.20889878659689404, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.002458161766680771 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.03307990095257621, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0011002276404168225 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.07910944220650014, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.0026293603468150466 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.04565942952067972, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.001484562672483921 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.11490133308951496, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.001481297426684668 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.26284399370938016, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.0033084414512192374 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.15587034501708355, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0018431637093872144 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.12158807333409381, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0016089880194761488 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.278789316707468, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.00364738944247525 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.1651849748571103, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.002039061494531475 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 1.8234981410881652, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.09861688194525574 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b6bc4seed1/evaluation/generation/slim.4b284b6bc4seed1_gem_xsum_article_DOC_summary_1.json b/4b284b6bc4seed1/evaluation/generation/slim.4b284b6bc4seed1_gem_xsum_article_DOC_summary_1.json new file mode 100644 index 0000000000000000000000000000000000000000..e0feff5eaa71eb736871e922ecca100411851bcf --- /dev/null +++ b/4b284b6bc4seed1/evaluation/generation/slim.4b284b6bc4seed1_gem_xsum_article_DOC_summary_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.12978400090119854, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.0018214048412026733 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.32027413224988105, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.00416743115408514 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.18254418171842912, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.0024443411491113813 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.025920284045820686, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0009915583067368265 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.06631766447507839, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.0026016286386155744 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.036825241144522146, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0014067669670603119 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.09779168145477703, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0013336831707437397 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.24393449987832236, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.0032690620169295624 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.1379121041144307, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0018159806506780998 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.10419708360998835, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0014908021891115058 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.2591470200293115, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.0035902088886349626 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.14685271867556554, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.00202786402481471 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 1.4511145888771138, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.09215852910549645 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b6bc4seed1/evaluation/generation/slim.4b284b6bc4seed1_gem_xsum_article_DOC_summary_2.json b/4b284b6bc4seed1/evaluation/generation/slim.4b284b6bc4seed1_gem_xsum_article_DOC_summary_2.json new file mode 100644 index 0000000000000000000000000000000000000000..8d74a38f56748e1608cd9c2409dbb3b880a85472 --- /dev/null +++ b/4b284b6bc4seed1/evaluation/generation/slim.4b284b6bc4seed1_gem_xsum_article_DOC_summary_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.12682893488466288, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.0018115124386976255 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.3129238773710033, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.004144317584991236 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.1784133650153775, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.002434527345664647 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.023792739813654398, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0009538695469598671 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.060628286518002124, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.002544171640335871 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.03377646994942601, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0013577113683580135 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.09538132852222156, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0012844315555328582 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.23736904076265325, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.0031180197306729797 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.13445676544883162, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.001742983161792639 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.10150079343006048, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0014805542361053387 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.25224041568358746, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.00356325287772434 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.14302327166537732, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0020121565752601223 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 1.4173910716715976, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.1269050055569669 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b6bc4seed1/evaluation/generation/slim.4b284b6bc4seed1_gem_xsum_article_DOC_summary_3.json b/4b284b6bc4seed1/evaluation/generation/slim.4b284b6bc4seed1_gem_xsum_article_DOC_summary_3.json new file mode 100644 index 0000000000000000000000000000000000000000..d4ab48a07bf6245c9712a337f373606d802c7a1d --- /dev/null +++ b/4b284b6bc4seed1/evaluation/generation/slim.4b284b6bc4seed1_gem_xsum_article_DOC_summary_3.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.12682835665999379, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.00213008962319155 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.3009777871605996, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.0045155564803296844 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.17405000505151677, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.0026158795444079694 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.02441534481786468, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0010675183688113013 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.060023335309239284, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.0025544641047680868 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.03375564198727498, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0014032677780195426 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.09672846502785581, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.001605939754348312 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.23129794905638065, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.003504325859643222 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.13287002402660542, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0019574198182001363 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.10242219504173285, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0017649678079630277 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.2447872835150151, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.0038950725453768833 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.14072796227018858, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.002188698179032325 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 1.4410854543220795, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.11065939978206533 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 3, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b6bc4seed1/evaluation/generation/slim.4b284b6bc4seed1_gem_xsum_article_DOC_summary_4.json b/4b284b6bc4seed1/evaluation/generation/slim.4b284b6bc4seed1_gem_xsum_article_DOC_summary_4.json new file mode 100644 index 0000000000000000000000000000000000000000..f7096663bf393eac8965c1a97f76e5cecf3be786 --- /dev/null +++ b/4b284b6bc4seed1/evaluation/generation/slim.4b284b6bc4seed1_gem_xsum_article_DOC_summary_4.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.041064589753945765, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.002574722440175742 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.07375404829054749, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.004261542973214119 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.046992144100321806, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.002618786666967082 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.0072827259137400735, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0008839873299209189 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.01434569739075993, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.0014362041655696376 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.008636963128827568, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0008391846215142884 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.03137075485796663, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0020006363883442293 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.05624031413634613, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.0032626943561910897 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.03548036137516894, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.001955807555849124 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.03357423627999912, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0021310282339018806 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.059996937228044826, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.003508594344969223 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.03810619457684465, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0021359009016179383 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 0.6753547790268645, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.09678811316166971 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 4, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b6bc4seed1/evaluation/generation/slim.4b284b6bc4seed1_gem_xsum_article_DOC_summary_5.json b/4b284b6bc4seed1/evaluation/generation/slim.4b284b6bc4seed1_gem_xsum_article_DOC_summary_5.json new file mode 100644 index 0000000000000000000000000000000000000000..554c2c05cf5e0956921ae430aa5abace018ab9ff --- /dev/null +++ b/4b284b6bc4seed1/evaluation/generation/slim.4b284b6bc4seed1_gem_xsum_article_DOC_summary_5.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.002394598265414318, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.0007029813930147865 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.0019954716710551207, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.0005584193559240988 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.0021338767527660316, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.000606716788713842 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.0001469327010392493, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 8.511648046715374e-05 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.00010241330996047977, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 5.9726635104036084e-05 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.00011901404509555748, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 6.872962972148577e-05 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.0017715789785566055, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0005103213321970242 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.0015030111824248839, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.0004165975224565321 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.0015909130557671355, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0004446509241590643 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.0020245246393824, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0006015169025391406 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.0016826910638698292, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.0004718028635824783 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.001799689332800904, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0005143272355042585 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 3.8720991740133824e-38, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 6.757775100349013e-33 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed1/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 5, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b6bc4seed1/evaluation/rankeval/4b284b6bc4seed1_0.csv b/4b284b6bc4seed1/evaluation/rankeval/4b284b6bc4seed1_0.csv new file mode 100644 index 0000000000000000000000000000000000000000..2edcf8a38c30c2916cd77efbb8a166f5bccdd401 --- /dev/null +++ b/4b284b6bc4seed1/evaluation/rankeval/4b284b6bc4seed1_0.csv @@ -0,0 +1,21 @@ +task,metric,value,err,version +anli_r1,acc,0.337,0.014955087918653603,0 +anli_r2,acc,0.33,0.014876872027456734,0 +anli_r3,acc,0.3383333333333333,0.01366414400661827,0 +arc_challenge,acc,0.2721843003412969,0.013006600406423706,0 +arc_challenge,acc_norm,0.30119453924914674,0.013406741767847632,0 +arc_easy,acc,0.5774410774410774,0.01013597822298108,0 +arc_easy,acc_norm,0.5290404040404041,0.010242463826395614,0 +boolq,acc,0.6076452599388379,0.008539983838167734,1 +cb,acc,0.4642857142857143,0.06724777654937658,1 +cb,f1,0.26694444444444443,,1 +copa,acc,0.73,0.04461960433384741,0 +hellaswag,acc,0.46285600477992433,0.004975993795562032,0 +hellaswag,acc_norm,0.6013742282413862,0.004886147907627405,0 +piqa,acc,0.7437431991294886,0.010185787831565062,0 +piqa,acc_norm,0.749727965179543,0.010106561880089768,0 +rte,acc,0.5740072202166066,0.029764956741777645,0 +sciq,acc,0.818,0.012207580637662157,0 +sciq,acc_norm,0.737,0.013929286594259734,0 +storycloze_2016,acc,0.709246392303581,0.010501233625213081,0 +winogrande,acc,0.5816890292028414,0.013863669961195892,0 diff --git a/4b284b6bc4seed1/evaluation/rankeval/4b284b6bc4seed1_0.json b/4b284b6bc4seed1/evaluation/rankeval/4b284b6bc4seed1_0.json new file mode 100644 index 0000000000000000000000000000000000000000..3c11c94676d59da51ba63addb31a58a1aaa5cf77 --- /dev/null +++ b/4b284b6bc4seed1/evaluation/rankeval/4b284b6bc4seed1_0.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.337, + "acc_stderr": 0.014955087918653603 + }, + "anli_r2": { + "acc": 0.33, + "acc_stderr": 0.014876872027456734 + }, + "anli_r3": { + "acc": 0.3383333333333333, + "acc_stderr": 0.01366414400661827 + }, + "cb": { + "acc": 0.4642857142857143, + "acc_stderr": 0.06724777654937658, + "f1": 0.26694444444444443 + }, + "copa": { + "acc": 0.73, + "acc_stderr": 0.04461960433384741 + }, + "hellaswag": { + "acc": 0.46285600477992433, + "acc_stderr": 0.004975993795562032, + "acc_norm": 0.6013742282413862, + "acc_norm_stderr": 0.004886147907627405 + }, + "rte": { + "acc": 0.5740072202166066, + "acc_stderr": 0.029764956741777645 + }, + "winogrande": { + "acc": 0.5816890292028414, + "acc_stderr": 0.013863669961195892 + }, + "storycloze_2016": { + "acc": 0.709246392303581, + "acc_stderr": 0.010501233625213081 + }, + "boolq": { + "acc": 0.6076452599388379, + "acc_stderr": 0.008539983838167734 + }, + "arc_easy": { + "acc": 0.5774410774410774, + "acc_stderr": 0.01013597822298108, + "acc_norm": 0.5290404040404041, + "acc_norm_stderr": 0.010242463826395614 + }, + "arc_challenge": { + "acc": 0.2721843003412969, + "acc_stderr": 0.013006600406423706, + "acc_norm": 0.30119453924914674, + "acc_norm_stderr": 0.013406741767847632 + }, + "sciq": { + "acc": 0.818, + "acc_stderr": 0.012207580637662157, + "acc_norm": 0.737, + "acc_norm_stderr": 0.013929286594259734 + }, + "piqa": { + "acc": 0.7437431991294886, + "acc_stderr": 0.010185787831565062, + "acc_norm": 0.749727965179543, + "acc_norm_stderr": 0.010106561880089768 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b6bc4seed1/evaluation/rankeval/4b284b6bc4seed1_1.csv b/4b284b6bc4seed1/evaluation/rankeval/4b284b6bc4seed1_1.csv new file mode 100644 index 0000000000000000000000000000000000000000..7fc9e6754e82ead91f80d3d759cf52988dfaaedd --- /dev/null +++ b/4b284b6bc4seed1/evaluation/rankeval/4b284b6bc4seed1_1.csv @@ -0,0 +1,21 @@ +task,metric,value,err,version +anli_r1,acc,0.348,0.015070604603768408,0 +anli_r2,acc,0.344,0.015029633724408948,0 +anli_r3,acc,0.3383333333333333,0.013664144006618271,0 +arc_challenge,acc,0.28924914675767915,0.013250012579393443,0 +arc_challenge,acc_norm,0.31313993174061433,0.01355267154362349,0 +arc_easy,acc,0.6043771043771043,0.010033741393430986,0 +arc_easy,acc_norm,0.5677609427609428,0.010165130379698746,0 +boolq,acc,0.6058103975535168,0.008546995661233635,1 +cb,acc,0.4107142857142857,0.0663363415035954,1 +cb,f1,0.21777777777777776,,1 +copa,acc,0.71,0.04560480215720684,0 +hellaswag,acc,0.46285600477992433,0.004975993795562031,0 +hellaswag,acc_norm,0.6014738099980084,0.004885942040894556,0 +piqa,acc,0.7388465723612623,0.01024873864993558,0 +piqa,acc_norm,0.7399347116430903,0.010234893249061282,0 +rte,acc,0.5415162454873647,0.029992535385373314,0 +sciq,acc,0.856,0.01110798754893915,0 +sciq,acc_norm,0.829,0.011912216456264614,0 +storycloze_2016,acc,0.694815606627472,0.010648664383985658,0 +winogrande,acc,0.5753749013417522,0.01389189315026423,0 diff --git a/4b284b6bc4seed1/evaluation/rankeval/4b284b6bc4seed1_1.json b/4b284b6bc4seed1/evaluation/rankeval/4b284b6bc4seed1_1.json new file mode 100644 index 0000000000000000000000000000000000000000..aa7d83c3bee2af83655e4d5168004dc9934e172d --- /dev/null +++ b/4b284b6bc4seed1/evaluation/rankeval/4b284b6bc4seed1_1.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.348, + "acc_stderr": 0.015070604603768408 + }, + "anli_r2": { + "acc": 0.344, + "acc_stderr": 0.015029633724408948 + }, + "anli_r3": { + "acc": 0.3383333333333333, + "acc_stderr": 0.013664144006618271 + }, + "cb": { + "acc": 0.4107142857142857, + "acc_stderr": 0.0663363415035954, + "f1": 0.21777777777777776 + }, + "copa": { + "acc": 0.71, + "acc_stderr": 0.04560480215720684 + }, + "hellaswag": { + "acc": 0.46285600477992433, + "acc_stderr": 0.004975993795562031, + "acc_norm": 0.6014738099980084, + "acc_norm_stderr": 0.004885942040894556 + }, + "rte": { + "acc": 0.5415162454873647, + "acc_stderr": 0.029992535385373314 + }, + "winogrande": { + "acc": 0.5753749013417522, + "acc_stderr": 0.01389189315026423 + }, + "storycloze_2016": { + "acc": 0.694815606627472, + "acc_stderr": 0.010648664383985658 + }, + "boolq": { + "acc": 0.6058103975535168, + "acc_stderr": 0.008546995661233635 + }, + "arc_easy": { + "acc": 0.6043771043771043, + "acc_stderr": 0.010033741393430986, + "acc_norm": 0.5677609427609428, + "acc_norm_stderr": 0.010165130379698746 + }, + "arc_challenge": { + "acc": 0.28924914675767915, + "acc_stderr": 0.013250012579393443, + "acc_norm": 0.31313993174061433, + "acc_norm_stderr": 0.01355267154362349 + }, + "sciq": { + "acc": 0.856, + "acc_stderr": 0.01110798754893915, + "acc_norm": 0.829, + "acc_norm_stderr": 0.011912216456264614 + }, + "piqa": { + "acc": 0.7388465723612623, + "acc_stderr": 0.01024873864993558, + "acc_norm": 0.7399347116430903, + "acc_norm_stderr": 0.010234893249061282 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b6bc4seed1/evaluation/rankeval/4b284b6bc4seed1_2.csv b/4b284b6bc4seed1/evaluation/rankeval/4b284b6bc4seed1_2.csv new file mode 100644 index 0000000000000000000000000000000000000000..85122fdf2efa7687922b8549a128e5f45933952e --- /dev/null +++ b/4b284b6bc4seed1/evaluation/rankeval/4b284b6bc4seed1_2.csv @@ -0,0 +1,21 @@ +task,metric,value,err,version +anli_r1,acc,0.322,0.014782913600996664,0 +anli_r2,acc,0.313,0.014671272822977892,0 +anli_r3,acc,0.3491666666666667,0.013767075395077249,0 +arc_challenge,acc,0.2832764505119454,0.013167478735134575,0 +arc_challenge,acc_norm,0.3165529010238908,0.013592431519068079,0 +arc_easy,acc,0.6022727272727273,0.010042861602178061,0 +arc_easy,acc_norm,0.5803872053872053,0.010126315840891539,0 +boolq,acc,0.6174311926605505,0.008500443818876165,1 +cb,acc,0.42857142857142855,0.06672848092813058,1 +cb,f1,0.2745098039215686,,1 +copa,acc,0.75,0.04351941398892446,0 +hellaswag,acc,0.4613622784305915,0.004974860878464439,0 +hellaswag,acc_norm,0.6013742282413862,0.004886147907627404,0 +piqa,acc,0.7475516866158868,0.01013566554736236,0 +piqa,acc_norm,0.7383025027203483,0.010255630772708229,0 +rte,acc,0.5487364620938628,0.029953149241808943,0 +sciq,acc,0.867,0.010743669132397332,0 +sciq,acc_norm,0.85,0.011297239823409296,0 +storycloze_2016,acc,0.7033671833244255,0.010562819181563226,0 +winogrande,acc,0.5509076558800315,0.013979459389140844,0 diff --git a/4b284b6bc4seed1/evaluation/rankeval/4b284b6bc4seed1_2.json b/4b284b6bc4seed1/evaluation/rankeval/4b284b6bc4seed1_2.json new file mode 100644 index 0000000000000000000000000000000000000000..80353083c23cdde17d0258959221e0046d76ec53 --- /dev/null +++ b/4b284b6bc4seed1/evaluation/rankeval/4b284b6bc4seed1_2.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.322, + "acc_stderr": 0.014782913600996664 + }, + "anli_r2": { + "acc": 0.313, + "acc_stderr": 0.014671272822977892 + }, + "anli_r3": { + "acc": 0.3491666666666667, + "acc_stderr": 0.013767075395077249 + }, + "cb": { + "acc": 0.42857142857142855, + "acc_stderr": 0.06672848092813058, + "f1": 0.2745098039215686 + }, + "copa": { + "acc": 0.75, + "acc_stderr": 0.04351941398892446 + }, + "hellaswag": { + "acc": 0.4613622784305915, + "acc_stderr": 0.004974860878464439, + "acc_norm": 0.6013742282413862, + "acc_norm_stderr": 0.004886147907627404 + }, + "rte": { + "acc": 0.5487364620938628, + "acc_stderr": 0.029953149241808943 + }, + "winogrande": { + "acc": 0.5509076558800315, + "acc_stderr": 0.013979459389140844 + }, + "storycloze_2016": { + "acc": 0.7033671833244255, + "acc_stderr": 0.010562819181563226 + }, + "boolq": { + "acc": 0.6174311926605505, + "acc_stderr": 0.008500443818876165 + }, + "arc_easy": { + "acc": 0.6022727272727273, + "acc_stderr": 0.010042861602178061, + "acc_norm": 0.5803872053872053, + "acc_norm_stderr": 0.010126315840891539 + }, + "arc_challenge": { + "acc": 0.2832764505119454, + "acc_stderr": 0.013167478735134575, + "acc_norm": 0.3165529010238908, + "acc_norm_stderr": 0.013592431519068079 + }, + "sciq": { + "acc": 0.867, + "acc_stderr": 0.010743669132397332, + "acc_norm": 0.85, + "acc_norm_stderr": 0.011297239823409296 + }, + "piqa": { + "acc": 0.7475516866158868, + "acc_stderr": 0.01013566554736236, + "acc_norm": 0.7383025027203483, + "acc_norm_stderr": 0.010255630772708229 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b6bc4seed1/evaluation/rankeval/4b284b6bc4seed1_3.csv b/4b284b6bc4seed1/evaluation/rankeval/4b284b6bc4seed1_3.csv new file mode 100644 index 0000000000000000000000000000000000000000..653e1ad95661f8ceabc96be14ffd0fbfecc48a6a --- /dev/null +++ b/4b284b6bc4seed1/evaluation/rankeval/4b284b6bc4seed1_3.csv @@ -0,0 +1,21 @@ +task,metric,value,err,version +anli_r1,acc,0.32,0.014758652303574886,0 +anli_r2,acc,0.346,0.015050266127564443,0 +anli_r3,acc,0.35,0.013774667009018554,0 +arc_challenge,acc,0.2858361774744027,0.01320319608853737,0 +arc_challenge,acc_norm,0.3122866894197952,0.013542598541688065,0 +arc_easy,acc,0.5976430976430976,0.010062244711011518,0 +arc_easy,acc_norm,0.5913299663299664,0.010087174498762886,0 +boolq,acc,0.6238532110091743,0.008472516562330725,1 +cb,acc,0.39285714285714285,0.0658538889806635,1 +cb,f1,0.3130977130977131,,1 +copa,acc,0.77,0.04229525846816506,0 +hellaswag,acc,0.4643497311292571,0.004977081808179426,0 +hellaswag,acc_norm,0.603963353913563,0.004880726787988643,0 +piqa,acc,0.749183895538629,0.010113869547069044,0 +piqa,acc_norm,0.7453754080522307,0.010164432237060499,0 +rte,acc,0.5379061371841155,0.030009848912529117,0 +sciq,acc,0.866,0.01077776229836968,0 +sciq,acc_norm,0.859,0.011010914595992436,0 +storycloze_2016,acc,0.706574024585783,0.010529489334744466,0 +winogrande,acc,0.5659037095501184,0.013929882555694058,0 diff --git a/4b284b6bc4seed1/evaluation/rankeval/4b284b6bc4seed1_3.json b/4b284b6bc4seed1/evaluation/rankeval/4b284b6bc4seed1_3.json new file mode 100644 index 0000000000000000000000000000000000000000..23e9dcf8055a38fd46796a4ac849a5cbb89d09b2 --- /dev/null +++ b/4b284b6bc4seed1/evaluation/rankeval/4b284b6bc4seed1_3.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.32, + "acc_stderr": 0.014758652303574886 + }, + "anli_r2": { + "acc": 0.346, + "acc_stderr": 0.015050266127564443 + }, + "anli_r3": { + "acc": 0.35, + "acc_stderr": 0.013774667009018554 + }, + "cb": { + "acc": 0.39285714285714285, + "acc_stderr": 0.0658538889806635, + "f1": 0.3130977130977131 + }, + "copa": { + "acc": 0.77, + "acc_stderr": 0.04229525846816506 + }, + "hellaswag": { + "acc": 0.4643497311292571, + "acc_stderr": 0.004977081808179426, + "acc_norm": 0.603963353913563, + "acc_norm_stderr": 0.004880726787988643 + }, + "rte": { + "acc": 0.5379061371841155, + "acc_stderr": 0.030009848912529117 + }, + "winogrande": { + "acc": 0.5659037095501184, + "acc_stderr": 0.013929882555694058 + }, + "storycloze_2016": { + "acc": 0.706574024585783, + "acc_stderr": 0.010529489334744466 + }, + "boolq": { + "acc": 0.6238532110091743, + "acc_stderr": 0.008472516562330725 + }, + "arc_easy": { + "acc": 0.5976430976430976, + "acc_stderr": 0.010062244711011518, + "acc_norm": 0.5913299663299664, + "acc_norm_stderr": 0.010087174498762886 + }, + "arc_challenge": { + "acc": 0.2858361774744027, + "acc_stderr": 0.01320319608853737, + "acc_norm": 0.3122866894197952, + "acc_norm_stderr": 0.013542598541688065 + }, + "sciq": { + "acc": 0.866, + "acc_stderr": 0.01077776229836968, + "acc_norm": 0.859, + "acc_norm_stderr": 0.011010914595992436 + }, + "piqa": { + "acc": 0.749183895538629, + "acc_stderr": 0.010113869547069044, + "acc_norm": 0.7453754080522307, + "acc_norm_stderr": 0.010164432237060499 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b6bc4seed1/evaluation/rankeval/4b284b6bc4seed1_4.csv b/4b284b6bc4seed1/evaluation/rankeval/4b284b6bc4seed1_4.csv new file mode 100644 index 0000000000000000000000000000000000000000..68f6b4d3d734486c77889e2bb81fe076deead363 --- /dev/null +++ b/4b284b6bc4seed1/evaluation/rankeval/4b284b6bc4seed1_4.csv @@ -0,0 +1,21 @@ +task,metric,value,err,version +anli_r1,acc,0.367,0.01524937846417175,0 +anli_r2,acc,0.325,0.014818724459095527,0 +anli_r3,acc,0.3425,0.013704669762934722,0 +arc_challenge,acc,0.28498293515358364,0.013191348179838795,0 +arc_challenge,acc_norm,0.3191126279863481,0.013621696119173304,0 +arc_easy,acc,0.6056397306397306,0.010028176038393007,0 +arc_easy,acc_norm,0.5812289562289562,0.010123487160167819,0 +boolq,acc,0.6192660550458715,0.008492625561656217,1 +cb,acc,0.42857142857142855,0.06672848092813058,1 +cb,f1,0.3487396784006953,,1 +copa,acc,0.71,0.04560480215720684,0 +hellaswag,acc,0.46265684126667994,0.004975845335086618,0 +hellaswag,acc_norm,0.6078470424218283,0.004872326888655505,0 +piqa,acc,0.7453754080522307,0.01016443223706048,0 +piqa,acc_norm,0.7453754080522307,0.010164432237060492,0 +rte,acc,0.5379061371841155,0.030009848912529117,0 +sciq,acc,0.865,0.010811655372416051,0 +sciq,acc_norm,0.851,0.01126614068463217,0 +storycloze_2016,acc,0.7113842864778194,0.010478311785642947,0 +winogrande,acc,0.5572217837411207,0.013960157350784985,0 diff --git a/4b284b6bc4seed1/evaluation/rankeval/4b284b6bc4seed1_4.json b/4b284b6bc4seed1/evaluation/rankeval/4b284b6bc4seed1_4.json new file mode 100644 index 0000000000000000000000000000000000000000..5960684bba06cba85944f0eb4498eb7191bf5f72 --- /dev/null +++ b/4b284b6bc4seed1/evaluation/rankeval/4b284b6bc4seed1_4.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.367, + "acc_stderr": 0.01524937846417175 + }, + "anli_r2": { + "acc": 0.325, + "acc_stderr": 0.014818724459095527 + }, + "anli_r3": { + "acc": 0.3425, + "acc_stderr": 0.013704669762934722 + }, + "cb": { + "acc": 0.42857142857142855, + "acc_stderr": 0.06672848092813058, + "f1": 0.3487396784006953 + }, + "copa": { + "acc": 0.71, + "acc_stderr": 0.04560480215720684 + }, + "hellaswag": { + "acc": 0.46265684126667994, + "acc_stderr": 0.004975845335086618, + "acc_norm": 0.6078470424218283, + "acc_norm_stderr": 0.004872326888655505 + }, + "rte": { + "acc": 0.5379061371841155, + "acc_stderr": 0.030009848912529117 + }, + "winogrande": { + "acc": 0.5572217837411207, + "acc_stderr": 0.013960157350784985 + }, + "storycloze_2016": { + "acc": 0.7113842864778194, + "acc_stderr": 0.010478311785642947 + }, + "boolq": { + "acc": 0.6192660550458715, + "acc_stderr": 0.008492625561656217 + }, + "arc_easy": { + "acc": 0.6056397306397306, + "acc_stderr": 0.010028176038393007, + "acc_norm": 0.5812289562289562, + "acc_norm_stderr": 0.010123487160167819 + }, + "arc_challenge": { + "acc": 0.28498293515358364, + "acc_stderr": 0.013191348179838795, + "acc_norm": 0.3191126279863481, + "acc_norm_stderr": 0.013621696119173304 + }, + "sciq": { + "acc": 0.865, + "acc_stderr": 0.010811655372416051, + "acc_norm": 0.851, + "acc_norm_stderr": 0.01126614068463217 + }, + "piqa": { + "acc": 0.7453754080522307, + "acc_stderr": 0.01016443223706048, + "acc_norm": 0.7453754080522307, + "acc_norm_stderr": 0.010164432237060492 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b6bc4seed1/evaluation/rankeval/4b284b6bc4seed1_5.csv b/4b284b6bc4seed1/evaluation/rankeval/4b284b6bc4seed1_5.csv new file mode 100644 index 0000000000000000000000000000000000000000..2830b88e231d4c18c6b7fa56bcde2fd70a2392ab --- /dev/null +++ b/4b284b6bc4seed1/evaluation/rankeval/4b284b6bc4seed1_5.csv @@ -0,0 +1,21 @@ +task,metric,value,err,version +anli_r1,acc,0.314,0.01468399195108795,0 +anli_r2,acc,0.337,0.014955087918653609,0 +anli_r3,acc,0.35,0.013774667009018558,0 +arc_challenge,acc,0.29180887372013653,0.013284525292403506,0 +arc_challenge,acc_norm,0.31313993174061433,0.013552671543623494,0 +arc_easy,acc,0.6043771043771043,0.010033741393430983,0 +arc_easy,acc_norm,0.5925925925925926,0.010082326627832861,0 +boolq,acc,0.617737003058104,0.008499149690449273,1 +cb,acc,0.42857142857142855,0.06672848092813057,1 +cb,f1,0.31174851513834567,,1 +copa,acc,0.75,0.04351941398892446,0 +hellaswag,acc,0.46395140410276836,0.004976796060456438,0 +hellaswag,acc_norm,0.6093407687711612,0.0048690101522807505,0 +piqa,acc,0.7453754080522307,0.01016443223706049,0 +piqa,acc_norm,0.7404787812840044,0.010227939888173923,0 +rte,acc,0.592057761732852,0.029581952519606197,0 +sciq,acc,0.876,0.010427498872343961,0 +sciq,acc_norm,0.871,0.010605256784796565,0 +storycloze_2016,acc,0.7044361304115446,0.010551778839373784,0 +winogrande,acc,0.5572217837411207,0.013960157350784978,0 diff --git a/4b284b6bc4seed1/evaluation/rankeval/4b284b6bc4seed1_5.json b/4b284b6bc4seed1/evaluation/rankeval/4b284b6bc4seed1_5.json new file mode 100644 index 0000000000000000000000000000000000000000..9eaf685c074a64c7a3d5df36c812ca17d20c1d80 --- /dev/null +++ b/4b284b6bc4seed1/evaluation/rankeval/4b284b6bc4seed1_5.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.314, + "acc_stderr": 0.01468399195108795 + }, + "anli_r2": { + "acc": 0.337, + "acc_stderr": 0.014955087918653609 + }, + "anli_r3": { + "acc": 0.35, + "acc_stderr": 0.013774667009018558 + }, + "cb": { + "acc": 0.42857142857142855, + "acc_stderr": 0.06672848092813057, + "f1": 0.31174851513834567 + }, + "copa": { + "acc": 0.75, + "acc_stderr": 0.04351941398892446 + }, + "hellaswag": { + "acc": 0.46395140410276836, + "acc_stderr": 0.004976796060456438, + "acc_norm": 0.6093407687711612, + "acc_norm_stderr": 0.0048690101522807505 + }, + "rte": { + "acc": 0.592057761732852, + "acc_stderr": 0.029581952519606197 + }, + "winogrande": { + "acc": 0.5572217837411207, + "acc_stderr": 0.013960157350784978 + }, + "storycloze_2016": { + "acc": 0.7044361304115446, + "acc_stderr": 0.010551778839373784 + }, + "boolq": { + "acc": 0.617737003058104, + "acc_stderr": 0.008499149690449273 + }, + "arc_easy": { + "acc": 0.6043771043771043, + "acc_stderr": 0.010033741393430983, + "acc_norm": 0.5925925925925926, + "acc_norm_stderr": 0.010082326627832861 + }, + "arc_challenge": { + "acc": 0.29180887372013653, + "acc_stderr": 0.013284525292403506, + "acc_norm": 0.31313993174061433, + "acc_norm_stderr": 0.013552671543623494 + }, + "sciq": { + "acc": 0.876, + "acc_stderr": 0.010427498872343961, + "acc_norm": 0.871, + "acc_norm_stderr": 0.010605256784796565 + }, + "piqa": { + "acc": 0.7453754080522307, + "acc_stderr": 0.01016443223706049, + "acc_norm": 0.7404787812840044, + "acc_norm_stderr": 0.010227939888173923 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..632975578bc12a91ba68a887557c61c31365b0a7 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1f41436dde8f7e13aa6cac6b2504b52d7bde93a3ce1cf02e70a12941ce69b6ba +size 199058647 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_0_mp_rank_01_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_0_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5b4ad38811204b9215b76e77dd2339a6b284d14d --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_0_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e414d5e5c47facda6a2f1c0bcb9dd11394fb94116eb1c3ae64b5754b31cd4067 +size 199058647 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..acf4087424917f10e77123b65a3a11f9c0327b78 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2058bf47d8390c713e684752653b22a2d31937554d072b1e3e80bb55d3fe910a +size 199058733 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_100_mp_rank_01_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_100_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6bfa13bdb8403b596b5df7d4a5287a1b4c0c2a5e --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_100_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e6f06b495d630b3b5fe7b8750519cd5a81caef6d99437dcfcd478b2768071dee +size 199058733 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e8483205b8ecdd510e3ceb6e6427884531c6769e --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ffc533278240f171207efd27a9b5667b25585df3d298052d4a87ee297a3dc4f7 +size 199058797 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_101_mp_rank_01_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_101_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ca67ff880f76dafdbb071b5d18069e7666d0931d --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_101_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eb0227bd26ba55a841791e961c3b3b2fcd28a51a36eea751d95f0a18e250c85d +size 199058797 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ab2ec245c5a0474a19fe38df9b29d63ccd358244 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e5ed4c5d143073a41e26133d8c96b21dd157e53381d0d7d1cb25e5c7392d5ffe +size 199058733 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_102_mp_rank_01_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_102_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..997c838292e96db46c8e88a521f5ed88f20c7df8 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_102_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d666f90b53266d72504a5dd7b94640a558eb1336f5e79fc3b300e265b65907d8 +size 199058733 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f55d266854fda3cfe8578aef23b8e185f2581f62 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3fa6a5f0ae399ce55632a51b6d58af96412b4a18236c8862091bee36b84bffaf +size 199058733 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_103_mp_rank_01_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_103_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..836f797101d929c4de9a6754024a1d6e4981adb6 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_103_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e0e5531a5736186a5840892ddbc02a30ed5fdc41b846f528be1d6921151c5815 +size 199058733 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4557bfd05bd513b52c88ec81bb28c25d6f159edd --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7f597f76c1126e255962e06c2b714eae0f59e6ed4efbd5cff288a0d50c1bc68e +size 199058797 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_104_mp_rank_01_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_104_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9b0039f48336f7f65182347bb3a54441a04bbe8e --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_104_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:10ffca4c8b0e2047207d4fbc54adc32c9f6c48e5b7235cbabd3e326be94b702f +size 199058797 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..48e4545a07b5234e54c2f90fe2b5ac58fc8d1a29 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aec59eb9c16e697111ba1403e459271442dae1162bbef333af726a947c0f3e3a +size 199058733 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_105_mp_rank_01_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_105_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cefaa96ca2763f99008ce272f9f31509e586f6ab --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_105_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b53141884c85d9386e5da4f9679cfb2b9dd47b5f72cdc713506b43af7183162 +size 199058733 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e60da2681205e0e51d860d8f378433d882dec4aa --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:73363cb314f67d54153a003f998f89e24063beaba9f831393f2996e046f1eea1 +size 199058669 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_106_mp_rank_01_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_106_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b55702306d5280ca1a2854795387832f126a2319 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_106_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee56d96db9fcd8c61262e369d3e1bb9062434b26700d62da283a57e3e83045f7 +size 199058669 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..65ffaa68619573cfb6f7125b128c874dafe510b5 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e07b38ae401e8ddd6b6d2c14985c4f023fac657f969b70253b48ed75ee12bb79 +size 199058797 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_107_mp_rank_01_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_107_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5984e2958fc1bc21b9afe73d5059bab7ae54bf55 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_107_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c6610fe1a5579c00929f9f94e7b523a9cfc54a553efaf40f17cfa12ede2684e2 +size 199058797 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..143281cd6811f8b52cd12d1b55097ce5761b00b3 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e5c172fc7a8f5759117d1c671f2b2b50e6ed3267976669a53c7b456209acae86 +size 199058733 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_108_mp_rank_01_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_108_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e3c6b3e73414a12b1b6c9e702a16b177a845fecd --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_108_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d4a3f702c70dc8299ebb49cbdf5fc912a9d9c2b759e60df6042272828d124df4 +size 199058733 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b72e5f5c116b0d081a274bef777fe6a1ebbf6813 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d4e20e0daf9d0b69bfa978636f7e619f34d576ef52e6761293f752a48b16a7d0 +size 199058733 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_109_mp_rank_01_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_109_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cddb870db17414da00049553eefcbadf0f41fc1b --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_109_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:701c5431d73fb885477d2a7124b73417f9dd75689b3a4e9bfb35add272b2db16 +size 199058733 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cdbc690a66dab072e83b6b1481b12cc3c13b6496 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1f02ba11ea4806028007cc3f911f46013c66c78d22b94f9efce3d39174157f20 +size 199058658 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_10_mp_rank_01_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_10_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3e87573a5c86f31732cd10ccd148fbad6eb0b001 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_10_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:49805e844db99592ecbe51df960c49ec1f8fff89f6ea48fa6c9ad12490c4793f +size 199058658 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fcba8a76258a65de2efe4bb44fff72624b7f3889 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:24f48d6aae2ee809dce6b501312c7f22746014e8af48a0f74c05fe287c556bea +size 199058733 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_110_mp_rank_01_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_110_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a90ed85bd8c8b555a2bcfe3d8a9d7063c7f40059 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_110_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:45eb0a89a4be1cf342137c9b5870985786103a0f1ae19f217195ff347bab8220 +size 199058733 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d6f75daf47374da3e1babc93a3c96e3d376c9c90 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6695b056922c97ef438e0d36f105ae12b15c8f58ac8f21eb4416d444ff0ef8f6 +size 199058797 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_111_mp_rank_01_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_111_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fe4117f1f014b17bb05e1337dad73181b23b5e16 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_111_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:adfb88332e75304f5b9c52ec54f69d4dd57b22ecf609362bb78d7cddf3306ad4 +size 199058797 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2809cb15a58d507fe6ce0e5948e3c9470466516f --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c3f04e0624495ec5bda2895b4e9f7abf88da8d58783f310a81f637b3c65134b4 +size 199058605 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_112_mp_rank_01_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_112_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9df20d6bc75f3209f035d1ce7ec5906881865c68 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_112_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:34953359fb220c57650a4d7594177b26246d3b9e00aab93626e96681d06f2e2b +size 199058605 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..90c1634a9d37b8b61b03441b6dfb9f748bcd22dc --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6110e4965468a5204028df5ea953e58c63389a5a50e9bc60c0740e2af69529ce +size 199058669 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_113_mp_rank_01_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_113_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9651cecbdebdba54e601f5a13272544377b4baa7 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_113_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:585df29f7b162aee7dcf33f69649330b22da69bd6c45f2755947d66752c723af +size 199058669 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ae3887240412ba1c0e9566e520881c2a0056d7c1 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3591e198e2306bf53f01b63d447fe350ca1e3aaf23f8f62d2281a87ccdbea828 +size 199058797 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_114_mp_rank_01_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_114_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9d6f9b66169b632d8799dc21b6685d53848d500e --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_114_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3d2e61d81cfa92e75eae70bd87c4d08d5b1cce09ff2600f527e823314a3a64c1 +size 199058797 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ad62f61eaf0646939c7bc53f00d0e0bb41cb3c8a --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:15bb43df194e818731cfeab1932e350f4c06a91756e7c9a6a902f3943d011b84 +size 199058733 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_115_mp_rank_01_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_115_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..94b7ec7a652a1576e074c04ee6d8c2883b3163d4 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_115_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:77ca78767dd3474bd0158d8cb079b8f75e3b481bfacf70188cd19b87a727eab6 +size 199058733 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..64070a860bbac91fac5a5377083ed3ef732d383b --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d1b25db728a30be5b81b0e3c3c99d6421bfe4bc87901ece30023d42ed0387be1 +size 199058733 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_116_mp_rank_01_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_116_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2e3994a7e3e6a1ef182b368dfc5762e5e0d18074 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_116_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d16047af33fb0eeb1e87917c6314236814a012edd96bada49cf9e09459e67024 +size 199058733 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3a8081595239e7dba84e981f3ce06834e2ed986d --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fda0d820a238f06befb39728048645dee13d1bd4af938c12032120736e403b59 +size 199058733 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_117_mp_rank_01_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_117_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0c50a14cc2fd35b9e9ffea9eff0966bf1ef47193 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_117_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da65d46d5545ec2c9b11fa94e08e7ccf09f292d74c613756620d044aa168b05f +size 199058733 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d7b284d2a21411d535c23d100d7b0e0851583fb9 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:429027a4071607e29ae0b305bafdf5fdadb1d9c45862796429452241c05d2e40 +size 199058797 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_118_mp_rank_01_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_118_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6198f7caebe21a02d8cac3ede9a015b1d5d5a107 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_118_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:738e80da5c3c315f160e033118e893af12323bfcd5584efbf5e3b4bf61a14b7f +size 199058797 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a082278f831625867a5ea4de47fa4df643452b49 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:08273455c119eb5221c8fdc924b935d4071e95aaa0766e15e273ce3f6df65938 +size 199058669 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_119_mp_rank_01_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_119_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5377e7cce492f8954a98bfc81a177ef0f4776645 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_119_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a4d258c36b0fcf8ba348093e1fdd7cd2106b48f4b1773bdeff616139e0a971cd +size 199058669 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ca5ca3bb0728b22002384806fe73b63638fabe6b --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e3d2f52f264e520170d3ffb617f0d27aee1c92540ca7b69b30dbe9c2acae064 +size 199058850 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_11_mp_rank_01_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_11_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1a1afedef81c0dca40019eac61f59a1090b2a8f4 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_11_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:56fe8f6e5f747faf2afeeb5be4e63a630c20ab7eb71e72a00c4bd491878af268 +size 199058850 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2e18546e7a5e08195d48f0a425c491617063cbfc --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f88f0c42573f4b0cc9b58e4e12ba187a7bd9ef0e7d19af7b859d1dfc58594bae +size 199058669 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_120_mp_rank_01_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_120_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..878dd8de496770e78b89469b7f5917252bbc2c8f --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_120_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0e03b73e41ebac87bd40e4aafd6704fac57b10e98918c60eb69e6af2daebe55a +size 199058669 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..acd60eeb312e80714f77bc3556c8a47409990969 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:738791a68b4a7baf3d6d86c67cc250a7739609d5a7b73617f29d6783a2ff2529 +size 199058797 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_121_mp_rank_01_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_121_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b201deb941a4e957f303e2d64f2f0ea467cbbf5f --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_121_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:92b2c61c898702e22d464da6317e3312eff7e211c447b60f740e891dfb8109ac +size 199058797 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3cd7d9c7179eb7f06805faa6d3b3653b47fb12e7 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e58401bc872e0d787ab18c8767a15e0302d37d1925b3e9db3b551f4163e59ef4 +size 199058733 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_122_mp_rank_01_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_122_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9a9429963d00a00ed59a9a942e5398bfb245e5cf --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_122_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2558cc3e4b530f3324e6db7f8ccb56745b79cc575e711db0683ab874a46c3904 +size 199058733 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..203d030987a3ed9ac6b61c2bc70648c009b9ffea --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d9880e173351497771042ced11692b6abfcd978f6b5f0be7d11678887453e7f4 +size 199058733 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_123_mp_rank_01_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_123_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c28b712c9c88a489ca3427d85a179a898fc6b056 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_123_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9cf1590626663f358eb4871598888c7e477c86a20ffca7aa0d78c2bc22f74748 +size 199058733 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e779c570e8112976e456270d2565999cbda840c8 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:37dac8d90fae372153f138e878894fded3c6e74550f4242523494ad55bbaf840 +size 199058669 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_124_mp_rank_01_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_124_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2d99e8b03d68ea091ae88bf52d584510354f42d6 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_124_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e01f0e767fc8e19e679d3802ec25e8f0c323d7f682af62253028f8802c3bee59 +size 199058669 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9a7de11767f93c9205c5bc75c2d81445fb02753b --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f56a7ceb36f7d010e8378e7f6704dcf2aecbaddb3febd57ba73556bc48a25edf +size 199058925 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_125_mp_rank_01_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_125_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..38520adce52064a350acd56d02d1eb908182e20b --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_125_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:65dcb396bc29675f688fb3f7ab57cddc966970e2d6f8f8007172f6bb89882a9a +size 199058925 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..be559bd403448d63953265423a5770dbea347c13 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:400d608cd9e88c4e027bd8879811f040b5238b73b51034dfd5b2a6e29054bd1d +size 199058605 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_126_mp_rank_01_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_126_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..657544ad12edbab09b40c40de321ec58444a1e25 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_126_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fdbf89018e51beb3d0279f3395f41b5c8bbaced8f143522fbabe31e0f34ee248 +size 199058605 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d87d7c0d40e65c5bd0f57156106aa90a0bf3a4e2 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:61a8c1820c7e44fca9f935b8fc97edc5b4134175e6393a711c56d02e095c1883 +size 199058605 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_127_mp_rank_01_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_127_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ce714d71b0b7d92359fb2f99b3fb93fa194cdb29 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_127_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:664870285b31503fe51e68a7a942c462d4108bd4085a0385afb521724edc7c88 +size 199058605 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f2320e5df8dd0239d388d8cc2e8bac8a30e24d62 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b620f8569f84ab07a54a95d0e9eef6b88217fb6bd1ffcc7b7e1967045c2d7c1c +size 199058722 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_12_mp_rank_01_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_12_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..33c05f7753b8605bfdc9ce05e5988542970b9e1d --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_12_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7ccffc0845acbc4e3343a156e277eb64b54a22a4f0dddd2d2097ee9d9b2d9fea +size 199058722 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a1d5d67b7cc91c6ef695d944d880e20261f2d31d --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bd72ac8ce6a70282585ae1d98c7016af0dae4283376c4b5bc9fdc5361a010781 +size 199058658 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_13_mp_rank_01_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_13_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ed0de01b9de681acc59a8201e50b849042f01681 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_13_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9123b434bfd38fc348194d83ad75f1ced6ed8b7b0e795e3be09b85d6d94dd321 +size 199058658 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0b5b8214833ea20ec017512ab9177e10eab20910 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c1207e28e3120b8d00e1638c92b53c9b8009f4dbc59ef10291f39492f9b2a730 +size 199058722 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_14_mp_rank_01_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_14_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a7dde7f9dc83aff76a265aaec4b97c3bebdf345c --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_14_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8454d013221e76cf72a6703e0ccaf576e48c03dfd9ebcfc0289858ccf3bbf4e3 +size 199058722 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..57647d757b2c152d52a3255a31e5b7f29e2b98dc --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8d751a63bfcb9454a6ec2d3b6aa3aedb1d2bb7a5e4cbc085e3ab1ce83e0f34b2 +size 199058658 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_15_mp_rank_01_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_15_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e1de8d78738ddcd3d22955a9b950a94551a006c3 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_15_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1c2d221da61aa8e3880e0a3846e00d3affe16b2c637715e4cadcb11291bcb2be +size 199058658 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d70e503302e3e82b5ae325cab0d0e2e6c6e2aedc --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e59804621b90199f9113a2ffe5e86623fbc78aa7b6db63d690fadbf713420724 +size 199058786 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_16_mp_rank_01_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_16_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4740baeae431854f9d7d8afc44a872dccfc4c222 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_16_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ec1d7d251ce02c892d9fe5f0386dc28774b53053689cb4b29b5dd18b1d99be37 +size 199058786 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4d45afe0d237b34b4fbf229464ea914d576512c5 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b208291372797cc446b8e298822deaeb6c1107597bec9333bbf1e2e3c4a56fc +size 199058658 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_17_mp_rank_01_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_17_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4fcc0b52f36ca8c9f2f132fb5e86f969e03383fa --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_17_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a02a7ebb48b0740da1ef9fb1c866cf5ba183a30cac6518911012e09faa4a2d3e +size 199058658 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4c988797e9bfd3eb4a390ff80e39ff4f2d5c7bf9 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9f679f4ae9765f59e0a269b344ef2eec2955ca6e9a5aa6ab34cecd17f47afdb9 +size 199058978 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_18_mp_rank_01_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_18_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b155c223ae8636cf0374a1a72bb1e97bd3a64c77 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_18_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a6755508e11aedec43cab695492d2a103d065f1bab014aaaed14b1624402de07 +size 199058978 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..987f9f62ce48af024766d98a6675bc2ea8df86a7 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5b1f606be3a31863b4782694ede945f248878c60ab29b5ff74a4f39baa094f24 +size 199058658 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_19_mp_rank_01_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_19_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3d194855e95feb245e3867d7830ceb742853ac06 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_19_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:773174e60fe9bd1011c0a20a2c618a36e36b09c90b22ccee257400a62d69719f +size 199058658 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4e4b3db4d19428dbb12c99c58d9f8e8c65a41580 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1cad85c5f6a3aa8563fa3352a59e99946b714fa3b369a140e2114a8f2d085dfa +size 199058647 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_1_mp_rank_01_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_1_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..25b62aeac1f872dc513ff57c8f7ccc9e7b34a380 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_1_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b7cc466ed2d80ed1d9292b4ba8dcfb764dd485ec549e21f84bae63982a1efb26 +size 199058647 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2d92a22dafab4863058dedccdacd0a8d7956558a --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2c612e2617d48bb51373e8ceacb33ed406339bc66f5ee583716425a4d1b6d604 +size 199058658 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_20_mp_rank_01_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_20_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ed47c96160295ed808b92aea1450e22bfe966403 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_20_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b3c49eba08a6b07870fed3a69060622c25114ccdf1891457fe12674122903310 +size 199058658 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0b939b5729ce25161a1d2f7cf562b989162b56da --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c9ddc8f2ec6fc0a759ec284f3cfdf4b9f05a8eed2ff25440a95705dbe6376d71 +size 199058722 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_21_mp_rank_01_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_21_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2f3e84139640624c0195c3ac2557c0dcb23c3f5c --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_21_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a772d4e9b0f61cd964a5ccc525eec4b6dad043a12596db821d8dbb5f000793bb +size 199058722 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9dd0ca5735af46084f14e3cee0c4a63ac3eaa6cb --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ce1eda6abd5167209272c1ac00933a8c89e0c699f9cecb37a2a96b349bf3ec17 +size 199058658 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_22_mp_rank_01_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_22_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4b0885d27ab84fdebcd6130661e8cca4135a01b3 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_22_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c48d964c8991ae99748ae0a59aaa2a83b9d41328ca2a93a8a3214ce50990eaa2 +size 199058658 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c71eb0b0175062571124b4d8fde3612fd922c194 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d3f63233212b1013b9209c11c3212e22e81ab5e98eea99e94e45d10215effdb7 +size 199058786 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_23_mp_rank_01_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_23_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..79f592b5f05b47a314d1551927d54de787a5e86d --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_23_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:476786cdfa73499aebf649ad86c6916df83c21b75276e921112d2ef55a30cb8b +size 199058786 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..129dba49d2e60f518d5d401c92963dae52ac7287 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ebea0c648eae5b43e3742e90a1fbdf365b504b38dd9d97b9836c2bcb534d9315 +size 199058722 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_24_mp_rank_01_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_24_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5689b3e86dd1d8cbb3a4ef4dbe8e74d8c847c4ef --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_24_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eb3c51897cac8198c9a1f49e0d169a3f09d0235fc53b9366dc1341f5347e6b36 +size 199058722 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2eb2ec32185531dd63f70207ae38b9ee31222621 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f4f311d3e22bdc26b87a4f02079c6e719b2afa69f4cc13d9ec61ad4399911ab2 +size 199058850 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_25_mp_rank_01_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_25_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f13811d0aed6493a921f4c30c0d3f3c26ef92e84 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_25_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:450ea42dbdf4ecf8133b088af6918123b4a7b538ff32b53858a6032b9ebc894b +size 199058850 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4f14a6df055a5d2295bac8fd54b9dcccafd144a3 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:358f5e35ea9397dd20ab26144bbe37ae28f912c40af955e30e1f2aee1180bdc0 +size 199058722 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_26_mp_rank_01_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_26_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..316c370fd4b9cc366a05e9fc2af3d88a4fc4de4e --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_26_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0d8cce760b236877a423c4a67c3172a2827c087d436910749b4f89d5699e0bf1 +size 199058722 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ca2c624df42228434558ca41565e9242977f6b81 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76f362eff352969dcb4b0350da98b9cd5520b7ae822ce1c3d19c56f1e2f0151a +size 199058722 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_27_mp_rank_01_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_27_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e3cba2fca57901103e00b110c075680f60d5f345 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_27_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e2309be5e0f0fef4c1bc87d0f7bea1f8f554058cd9b7a5550f863db99f18a737 +size 199058722 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a266080df96a14018cb72596d7ee74f08630dbc4 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:772b688b3cf91e4227d0655ba94965081cec95fa38718404c3195d20e14d15b1 +size 199058594 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_28_mp_rank_01_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_28_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..612fbd3110b3419094219151652d211156436bbc --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_28_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:af40cc800cc873cba1b8d23af357bec85d10f9530d3c41ef41b14ca4e2cbb177 +size 199058594 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1708b9b9c5433f482a5c1b2b47af794c3b43db0c --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:970aa80572414da8ac1b1c43a355b9799526cbf0f0ee4e907923cf0ab3fc6d2e +size 199058786 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_29_mp_rank_01_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_29_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1cc85774cece6345bd146e6327ea9a0587b27983 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_29_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3d441bbb9ee687f06ae19fbc4b9762c6f635b42a9a4b548b8d566eeb843471ca +size 199058786 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b7dc0d63751fffde0a8e9bcb11321b1e7d235e4e --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:539f0ddc4c3c5b21669448c754440b4396759a4bbb6cfd5c78eb74e49493fdd5 +size 199058711 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_2_mp_rank_01_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_2_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9f817c2d572807d865a0e7e436a13e5301680945 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_2_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e7274f39f52402ecad4b7b7b56475378aa73e2e2d77b35edb4d7095947d5bfd +size 199058711 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4f62109ace641db81a2f003cd1ee9bb978eb916e --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8064659ac525df2cc5ed6238fafe4b54a387ba2114b3bb38eba943824817ae74 +size 199058722 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_30_mp_rank_01_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_30_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ce64dfd1e9362da0c48c9c09eceaa2a65a1f2cdd --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_30_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:35fce601eb29b4713b28f4e60497fc480e6c6884e7ba14661b577e1aa548ace9 +size 199058722 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..42077273725e958b131baaec3a4c787008c22136 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d1b30dfb83d10e25a3c0b5131715991152a06ab56504d44d714bc369c5c2491e +size 199058722 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_31_mp_rank_01_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_31_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5a9bfcba5508bf89e44938abb76dda64b87199ac --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_31_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:46d9d5dfd2b9a35b1840cc718f9e0fe7562f9cd95af0fedfe341405f01cbbe30 +size 199058722 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..996cd33e738fba628a8f0d5f2da21f2c989c833b --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:31544e1c9b25b2833082ce1ed5340e18dfd3d47c400d9924cfef6e785325aa85 +size 199058722 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_32_mp_rank_01_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_32_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e9698294156e3e96b15d84f69b3acebd645c2677 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_32_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8239d211ace926dd33a0db79fd485b554a46ac23d2438a7943e93d93a064670d +size 199058722 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1392d31f1dd5c50b1f8f6a4ce3520188b3967088 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:32da333edeece478bf0f6d17b54293fc53a952594daf32a3683b848023e3cd08 +size 199058722 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_33_mp_rank_01_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_33_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ff34de239b1805847d0da58aecfa3e90197dee5c --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_33_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ed4ee21fc3583fbbf083f2327af7de057b45673b0ad39e5a1fbcd5fc18642c75 +size 199058722 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..adcf96e6abd0e49ed0830ac44828859ee28f1ddc --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:becf85fb5d8d8864e796653cef0add661e8146140d49e59094871e30c2591323 +size 199058722 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_34_mp_rank_01_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_34_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..707c7fe6f79784f8d9c3db137651b7f1b532782a --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_34_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fca130a1bf8b97a2f7f24ed1ecaf42111898c7ed3aa33e8218fbe1b03f21d641 +size 199058722 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..967408eada41698788ce8ecae703a94d0b862b6f --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b99b5f7a691f2830b4d946a5b2436aaddce755c014b9051d6852e9ad9b862479 +size 199058594 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_35_mp_rank_01_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_35_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5509bb95f05fede4853654d19290afc858488d31 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_35_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0102b8986f63e2ccc3c5ed16890fdd081a71b3a14d1c0fece9ddc47c8baa78f4 +size 199058594 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ef5e73da375867c77135e4e1cc177ed478010431 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2d7ee17d6b6117573bc184fa8bb76a5d855da5f14d2fd6471fd207a90ab14898 +size 199058722 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_36_mp_rank_01_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_36_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7c0b489092c47d1888d0211f81ecc8aaa7b40572 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_36_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0803364b1e9737c933c7dc3fd70718099843e54427979c98152439689798cc30 +size 199058722 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0f74162e935d6a856bf9c4b4b27e020075a34dbe --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:74058fe040bd0766166476c4fd45a690fc026e36fb8e39388573850acf3c7606 +size 199058786 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_37_mp_rank_01_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_37_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..34b1028143fa706900aed41eca4bd467b8077f18 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_37_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ae4edc8ce65e1b4bb38e9ac7a7a79474198546a4c1ec1f0784a5be98b419661 +size 199058786 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a1e9f447b7000df273e103d3ae96b677bef8e7a3 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9058793fbeab1542c04690a1d9b01a03f56649668f78234cb7af013b7be20080 +size 199058850 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_38_mp_rank_01_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_38_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..eb7f4a4ce96668967ef8af34c4b5d24daaca0071 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_38_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:050443e42c8354a8798e1068cda7b55dd264f006aae8a9ad073c5d0f3f9a063d +size 199058850 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cba303012ac58d9f5a73853486bee8025b3d21dd --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:98d89664429ce3d924f3dfbc3e7329ae34f363496c69e1faa56fb67a1f6e3da7 +size 199058658 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_39_mp_rank_01_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_39_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3ea31c468f837f66b77d955d2dd4ef90243a651f --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_39_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:174b70ac54f0f40eb5faa06e8b447ba87411815206edbeae3ce4bd58c6e78e92 +size 199058658 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..28c01b92d9b155739c0fb7e03300b053f8e8454d --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1c90addbb5af43f3c0d2cbc64a4e7ee04dbe6eda9171d11703695652e74b8986 +size 199058647 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_3_mp_rank_01_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_3_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..38cfd8179e9be8bfac68374ba391a20d2cdcc849 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_3_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2164ccde2a9fe5291ce94e113db78ce1e19b8086fb37d19dae941094ddf10d4b +size 199058647 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..61ed216c1fe860af0a62b2d5fa516559ee8eabfd --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4c4da2fe27b0e30c45bc6e0a13ee4be8b9cad54a5fc5a3ffac148b99eb5b9072 +size 199058722 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_40_mp_rank_01_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_40_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..697b6b2def169851ab82205d0f02abdbd08ec9dc --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_40_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:63433a52ea24d2569aac931281cbf30e56ecf92e4c8ae4ad785fe6f0f65d75ed +size 199058722 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5af987964eb39145c0e00ce077af5faddcb5cf4a --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b324bb32853011839e15a6e73837b91970027b7bb25335fdf6a5edf02126a5b2 +size 199058658 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_41_mp_rank_01_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_41_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f7e6031cd9081797f11187dbd993e855f4fb5951 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_41_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b456a1fb8fc7391321bf4e39c09a5d95b480c841ba91ae3c5ba63564aca4e021 +size 199058658 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..19a0ccd955353a7d2ae864a5b508bfe263060351 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c46563675e9d5741027f0faa56d5c49cc3a5dc7219388595b56774661cdd1e85 +size 199058658 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_42_mp_rank_01_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_42_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d7c78864e439b35c47c1335ef10ab141d67f49f0 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_42_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1087ebc7602be82040f5d0d9f99ae3f78c27a57df3b544b9deb560276c4d16e8 +size 199058658 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9a47df4e3da5b65aeb0f895edbb00df08309bee3 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:49d5d7e821ee3386c740b97a57dc43b373880a1fb77e65fbee1e00c65f184dbf +size 199058722 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_43_mp_rank_01_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_43_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3d36d28f491ca94e062e0fac7fa7a1073983e49d --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_43_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6c2a851cb9e1d51ba39c5254a5046bcbf2016aa4b1ae3c8bee734e385c8e8e9f +size 199058722 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8affe14675008e30a591a0ec60d2ad614036314f --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ac36f01cbe2567cf7ead3e81668b433f5bf3fb2f09b55b6d6e41770815cd055 +size 199058850 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_44_mp_rank_01_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_44_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..773655ac62119aa31b98950f223b5282112de369 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_44_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:38093ff9f5324e34e8145179f21001e764fa3d1a12c737ada5551b4ed68b73d7 +size 199058850 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..17df0f83a45dfc200659cd20b77b339bdf90e167 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a151180e5b4256c656d01bf150d73b8de45ffb2acd2ac0028f31adf16a03246a +size 199058722 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_45_mp_rank_01_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_45_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..20afc0cc986722e3b27c69bcd7b96d70e04e7844 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_45_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d2ab81999fa763e077d879a27a0f9409fb86698faecb24701032487330f9988a +size 199058722 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..90dc12394e0e09e21afd7eee8d57540c8e5f5d14 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:16080e34a5a48d488c89197ed84e5404772f4b46813f60503f09d8c0168b2046 +size 199058658 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_46_mp_rank_01_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_46_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..258e629c302748fc8a5a1a17d445dbb3def6865a --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_46_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:41f706c1214f249c60319d6b8ff9d6f6324f5058387c5e786fb4409ffa83a8a5 +size 199058658 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f43a9426860f478ecf7bf852c4183e8f22ca0c95 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:27446a373a2686e0812e76661c4cf84ccf44311bfdf8b5fb9b1646f82728e12d +size 199058722 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_47_mp_rank_01_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_47_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b76a4972a237fbe39bc6cae44a3ea727e43ac201 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_47_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3c6e49fa6029648de686e896c0b221088f5dbc804ed09f54056cbb7e2428df55 +size 199058722 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cd8441ab3efa00398845cbfc6246aebeec357dd8 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5ca1f8396ce1e423281ac58e316a97ef65bbcf113ba57f8fdb1727570a686ce6 +size 199058658 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_48_mp_rank_01_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_48_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dff012993bbaa6473788bc1db6151e9342e42b54 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_48_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6962708b0ab2ee8875f18f77d6c7f6e6465cdd46f1d483b388dd213d7ea94ffb +size 199058658 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..eb5b0a8ff98442beb30a824a148a5d53a7499b4c --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:657a0770155653262fefc6ca384f299b94f4f67809f245322cbb1f367319c1a3 +size 199058658 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_49_mp_rank_01_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_49_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cc0f73f2b3184756cc6e0cd67949fd45f1e06a90 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_49_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c2175cf43cbac2c7666343bcc485644de072f90a2915e9398319a3fc4fd9fc23 +size 199058658 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..eb99e5ee4146bf87c5bf772e68805d4aef0a6c88 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b6f3da94840b4285e01fe5cf6ceb2b52bcee2a0e6be48c3b25f4feb1785156fc +size 199058775 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_4_mp_rank_01_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_4_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c61851cacb3ae3dbf875e787c55db139a34e3d38 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_4_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:11e6299f0c6230de44f5cacdc2511bf2163296b344351c98bd7770e894fcf43a +size 199058775 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c912426f223d3415ddd6e7c2fcea6ced9507d7bc --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1340fd933d2659b88dec65417f5f4326a7641f1c7dc5ab8a6c9a5e68553ae960 +size 199058722 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_50_mp_rank_01_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_50_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..126df37c358bfd3b620514184711ed6e1d8e6bf8 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_50_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3d34d1f913cd00a9e332c942cc5ac51dcffcab4e079a6c187b8a177ef3c9c382 +size 199058722 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5dd8f338ee07166905a45b77a7a7164b76996a71 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:79e3ed2ee01b7462cc3e0998b6f6b463c2c4a5f5cc281ea159e7bdbd43394a4b +size 199058850 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_51_mp_rank_01_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_51_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..53947a8b62363a59a802275791cb9c1593d7cafd --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_51_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a9d4ff3f93dc4131e75b30be8a1f260f459b9f614d403b1d3bc64f161fdb9d0b +size 199058850 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ada7b082bc2c4cbfdac8cb7f7fba8a955c66bca5 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d291b33094b9fbae8513faf0191e7be73c8fb2726ff1fc93d04416a78e1ab32d +size 199058722 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_52_mp_rank_01_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_52_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9c229bd8882e9efae77a7a997f6d8e5dfdc8acd7 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_52_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:14b496a32b7e92d6b44f48fdac0262d2c77b9c143ebf5b20fc1095b97c79f96e +size 199058722 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c29e80b7b7433b4bcde39ad8d46db1abc9ee46e7 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:84a8abd5c39a992ce64e36984b5e5234f628f47d727ff8b758744034ff71b27d +size 199058722 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_53_mp_rank_01_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_53_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a1ff6dcc3b4fe08061eeb26f267d932a18a9e905 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_53_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f9d2f2b4d6e6eb8856d26524e3baa0b01156eafd71061857076137adf049da77 +size 199058722 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5a5c65e1017ffe3f0c822bf73d67d049a1af29b7 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:beab3a61b090f4f58dd8040317362c1c0ea41c89de2cf463f91748899033c006 +size 199058722 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_54_mp_rank_01_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_54_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bbab7a52db9cc80872dd9ca52f45a8111feba353 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_54_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d714b14768e01d9896b8352620251fdc52745dd9df5e9a36d2a39e43c5284c41 +size 199058722 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6d6688da20ac12e91c1fd3d0b07a0a7e1c5e6557 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:500c482be69f8e1c0d274455876eecfe555b519e5ce6a91a5a28d1fcb733e5ac +size 199058658 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_55_mp_rank_01_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_55_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..da57f3e2ef19f36c3e5c589cefa98639fc87661d --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_55_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b5bacee112ab062d05a67685f1434e8b4fb1661f39cca86392bb92f26c8a7b1c +size 199058658 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..644c1aaa64486eaa4e149c89b263a5b0d1dfde8c --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:340655d894b0523df029fe8fbc9fd126b56bc64708f072c299752fe393fb32d5 +size 199058722 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_56_mp_rank_01_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_56_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4b3667b18a2beb92beecd55faa032214602e65c9 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_56_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:41210aa8d71b8b03f33566cbe403a76376080704ed0b2d8e509dfa996a39d653 +size 199058722 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..84070c84d63ca8da47bd6304feff9c59e911f1b1 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2f1696437c186b6f3eef8bf0eaa281d62bd10c14776188f7fd7fc14ee421b703 +size 199058658 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_57_mp_rank_01_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_57_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b248c71c57c6c5d88bb3619ee3a6b7ae244f791d --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_57_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3496b550407ac766b5eabeafda53a770e9ceae6231805f2d5965cb3af304e7c3 +size 199058658 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3f4140b7677cd633539e05f4e832a53a870a6f85 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e83c31c0df9c9ebea0939999f0df6ec12a8f0c6c6c0bf39adbb383c44f80fef +size 199058914 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_58_mp_rank_01_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_58_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..aa755981c320c2dcea7d7787815717c724016f3d --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_58_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0c6f14c243dc3e254dc83d0e25ae8135eae98705896166de9235092030ce7be9 +size 199058914 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f0bd1d71ea231ecce6548dfd6fb35add1970d26d --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d1a8211e01346f6abd2a8f93c6245fd2bbb3124e6e3ee501297362fa757b647b +size 199058658 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_59_mp_rank_01_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_59_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f44f991baf569dbeed37ca4de5863b420626d794 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_59_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:488d0154080fef6f86d1e8ebaa979846664a9e76689bfd6a33c8c37cef24a8c4 +size 199058658 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b2714bc72f973098579d32fa8e272bbd4eb9d7c3 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6791b7e2634cc967d38b89d8faa1ac09edec1f0354b98e506a5999f7005773a3 +size 199058711 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_5_mp_rank_01_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_5_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cbe59b83cf1c3e60bc3d7337f512da446a4e5ebb --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_5_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:305865e02c42808bd8b057ab08723cf26ee190e4e2b501ba696c6ef89a34aa14 +size 199058711 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8635177e0c12749655cd6fc20bdd10e330cac372 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:42bd521cbf4d158e690bdf80585b285047eff812214f815d7130463498c8b376 +size 199058722 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_60_mp_rank_01_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_60_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4f964768b158e0274c0f39f4fb44f54a610313d8 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_60_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a9963e2b24e4e0e9dad4558f033255f7480549bc29d46dad7912626c6101a2fc +size 199058722 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..94f51f6169fab3bc64c014fd5823853b2099cabd --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5a34acd7d1ddd87ffb11db3312e20a461f075170bc28704ad10aa11a6adae7f1 +size 199058722 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_61_mp_rank_01_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_61_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0f2ddf0627f9d2a412ef33b6b8da58249dcffebc --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_61_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:61c10c867c00f52a9bde09c31096b1798acca6b8275b236610c973a5ecdffeda +size 199058722 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1ead8914aa8edc702e06d9fab88b596ede0d715c --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:81210742586f0a0a644a91db61afb3d5c9910cf05d4a3059c708380a919ffa83 +size 199058722 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_62_mp_rank_01_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_62_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a05f8a8084e4b950261046f563b0c168944782d7 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_62_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df4a05d01fd519269b3e014a532829743296a64cf7a8fac0f4dcee328b16e600 +size 199058722 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..62b2fef53ffab622e330339463b39bd044b14d4a --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:920e5b911f9e3c894054627cd06d2f795bfe51d2e1bc85bdd687919d5d956ec0 +size 199058658 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_63_mp_rank_01_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_63_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9c4d945dbd3e3e09f60f93df3baa4451f5f22d95 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_63_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:147f77eb7debaf85389d0d24b82bc4c50e94fbffcf0b5b8ba45155fac66c614d +size 199058658 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..26320d1ef3e324e10cacb276c6af36838b1d8e6d --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b7a12d94f5e38a358938e642cac2474cfff4f86d64e2325694b6510e7f78687f +size 199058658 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_64_mp_rank_01_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_64_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..93c713cd67496419b2050c479301167e115511d6 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_64_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e3a16aaf3147b542fcca46dc7abbfffeef64bbf46f2848c5f2720b0b89dfea0 +size 199058658 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5a0c9cc18c6b1f22734b481d1fb676a46d675c49 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d7229ec62ff787908b59b889b7569ac73d6a750122d8f2f831de9bf607841fe3 +size 199058850 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_65_mp_rank_01_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_65_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..61bc9a3e4c98894255fcefc356a2fe742e060ecb --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_65_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3d0b26dcc1634c407c2b5d616219ae38d39645de85a94469d293aa163dc30f21 +size 199058850 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2668339b82fda21c9a3f9aaae9585c120e9d81b6 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aa71d2bab115878c0ffeb67d2843c465859015a4bec35d4ccac9f71557687e3d +size 199058722 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_66_mp_rank_01_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_66_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b2ee928cfdd0ca0795384a1241a06dbaf6500900 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_66_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:13a11e62922772b1f825f941127426f0f966df357f4d5957e536897993b66faf +size 199058722 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5fa6955acd887bf7f9d75302e153da861e771d2a --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1a8140b12a800428745770b59a23aa602f162b7fa00dba8e1cb39a9032513753 +size 199058786 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_67_mp_rank_01_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_67_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6d5483104f18b62087137bc26ecc297d5a19bc05 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_67_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:be9af1edab886052439570ec877783897844117b593668ed6e0af7ec8ecaf4ff +size 199058786 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..87de55eab31d8176aa1c441be7bbac9b3e539d05 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:122d4f2a9a5b6ee41f07d2345bfac495a8a1487e345b0e267cc73ed3f1ce53a7 +size 199058658 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_68_mp_rank_01_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_68_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..82101cf01838578d11010b97f9d4800f4d088a01 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_68_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cdda439f72aa0e55091f8fe971bab4337c16aa61f15129e9f9a7c76f02b16f9d +size 199058658 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5cce9cc18ecfc8807516a54c85cb4682a89e4214 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aa8acadf8a7dcde1b9c9b24efd778154fb9f24df589e155158a88e8205bd9ec1 +size 199058722 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_69_mp_rank_01_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_69_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1434ecbb818b4215e8194bc8d9bec8034f9888e7 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_69_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd74ec0760ba80efefbb156cbce57a01bdd3694a952dbddcade73ded62218f69 +size 199058722 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3a07c5311263b71d86459692bb3a3ae19a91844f --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fcbc2f9291074316a6dcf365629fea588c7287083f868ae5509698da7f5f0af8 +size 199058647 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_6_mp_rank_01_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_6_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4f95e3157cf6d89784d1b29543929c04b5e1270e --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_6_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba79e581daf3f85bd20da1eb0dcd1bf6503ae2a46de384e9bde5549ab488d5d6 +size 199058647 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c8493e27263297960194a28b0b40eb1bc90a53cd --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ff39e8a142d662d15a023eeacda813ab57e91e802d7819d6e8e2693a5d7b130a +size 199058658 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_70_mp_rank_01_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_70_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dc4416b29aa523a77fbfebfbb6ce8f25f58bda4b --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_70_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:afabf2e13a7ecf249791b85f7cf8c05071d3a8f83994d6f5a19ce426677c5205 +size 199058658 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bd0f9de4b27bf419dbd318399a2dd12b45bc433d --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:294cd27eeb7e9b958426cb1cb4e2b9db5cbceb42d73b3576934234e594361e98 +size 199058722 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_71_mp_rank_01_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_71_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..08de7ad7e0a42f7705513ac078fd89d20dede65e --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_71_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aeb41273a03ab045219c890caf0efac7a8bd67ef1bbf76c1ba090ad313e4f498 +size 199058722 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..86e26b9e20d715c341d9c5197031db6b95f261ac --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:606eb446803952a99e76245d4d44c80db499c7cdcf8ba04041272eafa71529b2 +size 199058786 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_72_mp_rank_01_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_72_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ff61b11f466723e34919cf1427d22f07ebd225cb --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_72_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9aadab1498987d7e9da79b6326bab41b1e76e268d51a55c40868ae46960de9e3 +size 199058786 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1672c8d99ab2cab40ec5617b8179517c8bb43ae4 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fad7d741f2784df06632ffd197dd99f0e599d0dc6caca2137ddbeaa6f00745a9 +size 199058722 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_73_mp_rank_01_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_73_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..35076faf9517ef1da8b1671a1019b82dfaf91207 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_73_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:81412c76dab39fd12843a3e636b1a3e3d5b5fb651bd561be31132cfafb450f48 +size 199058722 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..45f6a6cf5fab7d59d588e45fbc7454cd3452f9dd --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:241933d847671c50e675c317912a05c6492b70010ff3a315de1d2d0ec1ba8db6 +size 199058786 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_74_mp_rank_01_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_74_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ef3112df87176602aa2b84cf382713b806c844e0 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_74_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:27946ac85d8c005c89ca7aa4ee3a719846dccce4c25d56ae8755dfe05c8139a6 +size 199058786 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d64d7c96337bcdc4f382eaece8cfa5555febc467 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6807df22aaea5044cf008cf5f38694ca7cef2e401dba2c3c20c3d71db742ff7b +size 199058658 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_75_mp_rank_01_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_75_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..115cad8a9fd7292939337801007e713c26aed4cc --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_75_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9428a40d1890692334e4eefc0fd1497e3d1e0ef192542488d4994b68c08a1f33 +size 199058658 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2694a892221da306fe4ff653d9aef03f71591ea8 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e420963f61bc87ecf0113ed8330367c2ee0b34c57f2e487674d86b71817b68cb +size 199058786 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_76_mp_rank_01_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_76_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..966412d151264ef2a9746d8059fe4b51f2be2cfc --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_76_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2c22d1387186085020156397d234ab82246e4282c8617f799c72851c14d5f081 +size 199058786 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..33550debaddc4cd27f71010c5b87ac53968c106d --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:672a9520b1f8b9fb6b652cfed2d02d9e437ce7b899c5da22efce3454b8180a2c +size 199058658 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_77_mp_rank_01_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_77_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0047326d3f8924c21330385864b2ef4415d8e1d0 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_77_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d40e6dab4a55d1a34f6378c6ba04dac2d00d313c65658a9a691a89fd4f7ae18d +size 199058658 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cfef3db23f59b1f5959a4adbf06fb08b0774c0b6 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eb57a0b3a257e821be08b220f8c73e2becd099888ed25378a493c3ec0e53653d +size 199058786 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_78_mp_rank_01_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_78_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b6999d9bc12e33ecc717b7c8e57709bde2cbe5cd --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_78_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8e776dc0643e34156294067bc2acb6d48ed9ca48a8e45e9beb98b1206ea502c0 +size 199058786 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8e51578749bb90913e050e0b3c82a671c7a13c8b --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d25e6dbafba393c1b73d32365eb38b4fdd5838dc247285fdf084bbde096e0d75 +size 199058786 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_79_mp_rank_01_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_79_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1c7b54a4dc95ef3369faf8567fa6864387ad2ace --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_79_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b7dacb3fc7e4df477019bfa11659ff9c10015a91f3972eed4f40fa596a1267dd +size 199058786 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ea1defde171632f65cf635e50031efcb2b3c0f1d --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0ade8c7ddae22f3fbdfa765c4d9ffcef45b0f2462b932ed16a8c71020d36509f +size 199058647 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_7_mp_rank_01_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_7_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b211b5d598641472da9aa5d5c4c35f399f45e6fc --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_7_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f2790807756c691fab54f72e464eda780962f31ef9bf0eb8255a064a408eeeff +size 199058647 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e57ccf969bba4baf297ca046c58a9f1840d9e667 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:832666217b8b589c5f207f54b7a8540d703c160236d62731efa7afd6f45a4d63 +size 199058722 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_80_mp_rank_01_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_80_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b04dfabf5ca8119da7d4901a77bbd0c4df21c4b3 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_80_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1dc7eba207b59f70604dbdc8cc5072f250e7cc6d22fe73c5ab8be014ba209584 +size 199058722 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9302f5788b2b976091015a3507682eacae3372f5 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5896ebfbfb6e4d002359e641ad7f014dad07ecc2ce1d2967f393172de88b6bea +size 199058722 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_81_mp_rank_01_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_81_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..64eca9dd65c35d08301b808849f06a72bbdb8acd --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_81_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:869740327c7784e7d0c333adccd342ebe8022bd039612f015699f896caaa0cfb +size 199058722 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5174973e9c1aad5da4af1af322b0e28a493b3278 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:18ecaf8b2782843029605fd8092c4d593ee1ee0845557f1021ea250d2b8b5bdd +size 199058658 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_82_mp_rank_01_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_82_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1f50e114f8e63b56968af259c77da478aff781a1 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_82_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:493df75716e84060920bdf750e28724a5c96fb2734526f22e090831e8b9a8124 +size 199058658 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3631756c044c19b62c777bdaf841f170dcd9cc86 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:85c93800e97c565f4829aabf394d485d72a8ca73259628c95f24a11947224533 +size 199058786 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_83_mp_rank_01_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_83_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fe6509789b0bef143d3918ea4ecd04e5c6916ca2 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_83_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:12c670aaabcc8ecef0d935b27ccc47df0cde5bb4d1d2ac2511980565a4d291d2 +size 199058786 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0a376b4f9ed6ca376dc90556b0e91b3d42046f2e --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1a8330e00de0a76740bd2b2a1f5dbc8315ebbe21687ab6773dfb41353498df56 +size 199058658 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_84_mp_rank_01_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_84_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d1abff3110488e7852bd7f595b8b874f8b08bcc2 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_84_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:db6e91372460205ccdad3d6fed0e983c65808068296556b2f21a7f2498fe7b71 +size 199058658 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..40434abf651a189f6eb3041628029f8ecf31f5fe --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:354b6e140f698ea923611ea6d8cbc85cadfc2d460d40b820ac1572c416cf1c6c +size 199058786 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_85_mp_rank_01_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_85_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..06449568aa3871d60c90c3640b25323fea3f7667 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_85_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df3cf7420dca4351b1ba0cbf7c4eec9386b5d25c6059f59d4bf46c4f099e3418 +size 199058786 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2e4eae241f473786dab06a60980edc12b039dff7 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b690e20f910d3e792592f42415209ad6e61d206f4018333e6820a3e8a19425e +size 199058786 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_86_mp_rank_01_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_86_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6475f88a05bdc6726d9016263f8931163d861863 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_86_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:35c77d6eef698f38913338f111907a6b1d0da994340c43c700a88efd633d9946 +size 199058786 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6de7524bbcd4f498e9584c721ce94b76e545c298 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5a3e056d980bd633376e722ad5bc31e45eeb1d3cbaf4840ae39640eb00a4e18f +size 199058722 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_87_mp_rank_01_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_87_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..65a4bb2c4a81bc62cc684f0e22fbc4712f7bc44e --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_87_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:557f37c09e80993d849abdf9ecfbdff461529c6f393d3ca3389dd407c9d04a22 +size 199058722 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6416d2e02919c6134eb4809374243c511506b310 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76720c5081cf3016947f9cba0f594e0f34b98317a324fe78b7b86324a178f673 +size 199058658 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_88_mp_rank_01_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_88_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5cac91dadb9a40971c96fc911d2c5c34062ff02a --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_88_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:39b8f5d463be4e533889a8a6f76aa3eab32db6d2e3372189f2b5785c824cd421 +size 199058658 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ec0c53b68836b8c2fb9c29253fa507361677604f --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f12477e5fa6afaf2c23e4625c64a8101b0fda66d803c8aaf43ca17525749b912 +size 199058658 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_89_mp_rank_01_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_89_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..58d17f830dfd021c2f2220f74f2545c9c87ee478 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_89_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:12341a08d385758fd082de72ef9a8258f9f21115a48f4fc5452681328253915d +size 199058658 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8e88549e1da60b218d8185599a7341bab1c046a1 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5b1220dd1b28d517998eb1811ba5e4bcbaf3c416b0b10388c73307d73ab72cc7 +size 199058647 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_8_mp_rank_01_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_8_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..89b5442f57d080e369194fef83abac8f997b38f4 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_8_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:176eb95183e2c7d95feb4006da3af09ceafc40fe4b9e19baef253f66395a95c0 +size 199058647 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d9bb04953e5b6c73827df223c97936799807ef34 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e03d719054def7ba064314082e632bba116c7f47991ba04f4d24526aa046623 +size 199058850 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_90_mp_rank_01_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_90_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8d3a21a48e9852c7796a453f422823c5c6868b47 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_90_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b7a49f1769ce230f2363f380689ef8886ce98cbf101ebbbcfd345b93fb0426b1 +size 199058850 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..67ca0b2730f656f4c04daff8cbc2fed24bdc231b --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:13ae4064e7c4132216e11f0d5093d5db8ed8effa8d2b61307d987f8f23c77a25 +size 199058722 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_91_mp_rank_01_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_91_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0987ad84664ae5ef51c62d7b7e7d27568660f582 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_91_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a3632879fe3afea1f8fdfcb831fb37adbf2fd53507d52708c3df95bac244a9df +size 199058722 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..889b8834b0010272e0f378675ed60475d46eef58 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c6fc44494bf2f90374ce2d9c084499dc36c0c705a0a6803aea2d700ea49cbc35 +size 199058658 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_92_mp_rank_01_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_92_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..35c3c540851849068f46a0a21dd1c1f276daeead --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_92_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d3d9f8991cf02a05e55c2299d8bd20e72dde5201a699658ac6fff311d1a26a2 +size 199058658 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..57d64d542bc50021c3d5b4bcf3dc9cf9632e2708 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:686df770e1bd0bb2575f02349be98cea9c639fe1a765495b1ef6cde554ed149f +size 199058786 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_93_mp_rank_01_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_93_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..964232c9cc43e8727da5423a2be832349e0c9e04 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_93_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f368fc1eba1e218bf36629c600f1fc5db424c01d8282b4004ae859bdbc747196 +size 199058786 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2e29235260758f267b201f91a3ce4a4f87d77b62 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:214a556bd6b7db922a34dfc6318d3ee1508b9f811a556a65a3aece303e18b30b +size 199058722 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_94_mp_rank_01_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_94_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fec2afe1ef54ae800d2ab9a14e624ce11f9eb222 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_94_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a3b55cb3e8d0b3ba360ac9a56987437a13b88163e45638a3b21300816e2188d7 +size 199058722 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9d2acd579bd814fc54ea696398010c2ecad6cc9c --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:77b6e7788783a9f04004ccbffcdb76020518e9cb6c85f0ce1aa651e9994b2efe +size 199058722 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_95_mp_rank_01_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_95_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0e76874abed9e0b0c954913bb2f78352aed43ab6 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_95_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a3ebc92983cc8eba855ff6ab3563c8b0b17c60d604ebd96297ca8d916a9daf55 +size 199058722 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7ede01c6dc740e76f319e5b3da42947f12e20b68 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b4f136162e989932b158874c9bf699fd9c9aadd99e1b7d0a9f0b34f8bc8dc700 +size 199058722 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_96_mp_rank_01_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_96_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fa9b73b42d97b1b64912d0cbfcfa966e0d97a1af --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_96_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e7338e24287a442e977ed7552f044dba8c9310a094d130289b66f9d3d7fe846c +size 199058722 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f3e56205c6d1d6d48a19fa4ff5963cb333e42e54 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7e5e2bbe993505c2d81b0257f1bd9331eb6dbff4c77556f825f89f0dfb608ae8 +size 199058786 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_97_mp_rank_01_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_97_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0d31eaaca12939c6531e2ae7d71dfd4fd8a77acd --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_97_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e9c9da4f659b9cac3466eea48aec7a18bacbaaeb3f80d71c3d32486da2883133 +size 199058786 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3793f2f664f7a99ae26718368fda1b0670042199 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2dc04dbecd912254864605ec268df6ec0aa92025a3ad105450fff6cec67791b3 +size 199058658 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_98_mp_rank_01_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_98_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f793b900b6bfe61bb7d549e1992bd7d7b3b2ff29 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_98_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dadab95b7c6388e0a8a645071388ca2af0adb43caaefe538c3894e6dd75563a7 +size 199058658 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..32877bbbd1e19c0e78dedc330510eca665bf088e --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b714f30f82125b520008f241ad8a978e3a069b1aec8ef3a1c83a684bf334f6dd +size 199058658 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_99_mp_rank_01_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_99_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4f32a5a6f795a8ded089e428efbd766269efa4d0 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_99_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b27f26ef7c0bcdf1d32ab05427c83884afb6ed74d6e68c4640ce97b8810f3a6 +size 199058658 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2f8260f97c5da9364b2b2926b9af26ebe060907e --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:446d4471c9f6b19426173893d4956e3cc49961d114b538486e1999cffcec34b8 +size 199058839 diff --git a/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_9_mp_rank_01_optim_states.pt b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_9_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7fa79ef12bb65c6801a544762ac27ee5933efbe4 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/bf16_zero_pp_rank_9_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b15aff57ae9bf652035cbc59132b72e57ecfc0ba6ae8797adba26ae7e874b367 +size 199058839 diff --git a/4b284b6bc4seed1/global_step80108/layer_01-model_00-model_states.pt b/4b284b6bc4seed1/global_step80108/layer_01-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..05568675c4003e3c4f640cbae02a995f76631065 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/layer_01-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:57dcc1bce8067b5e88c59a4b666ff8fd55dcb32cede952bec532b5c029d4fcaf +size 167511299 diff --git a/4b284b6bc4seed1/global_step80108/layer_01-model_01-model_states.pt b/4b284b6bc4seed1/global_step80108/layer_01-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1f5b4890ed8055f6f5260a7c5cb39660c7746a11 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/layer_01-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:98d65df3794841782576cb2cfcb7a60f558e6fdcbe928ae83fb1895c4d3bd86d +size 167511299 diff --git a/4b284b6bc4seed1/global_step80108/layer_03-model_00-model_states.pt b/4b284b6bc4seed1/global_step80108/layer_03-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1b39476ea185281be5640fc385c72bc6d3ad2ea2 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/layer_03-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5c88ecf4de670ce999cb0a2eada704a6ca004f866e6b7ea5ef0e89355b8dec7b +size 113308931 diff --git a/4b284b6bc4seed1/global_step80108/layer_03-model_01-model_states.pt b/4b284b6bc4seed1/global_step80108/layer_03-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..566898fa8ffece6d264c07e9e7542bd6f9d3ba7e --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/layer_03-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da37ab9e327f214c7421a22cbb27c1b7f68e18dfcf9f5ae45abde4b6239656e2 +size 113308931 diff --git a/4b284b6bc4seed1/global_step80108/layer_04-model_00-model_states.pt b/4b284b6bc4seed1/global_step80108/layer_04-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..743d4345314a0c6fbade7bb3fcc5e886b95c6ed4 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/layer_04-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4b7b2ae8e5e27310a4f7a66d1c339a0f76c94162ebab85aa59744b3c36fd5ebf +size 113308931 diff --git a/4b284b6bc4seed1/global_step80108/layer_04-model_01-model_states.pt b/4b284b6bc4seed1/global_step80108/layer_04-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e88e5efe791b1101e4f441ea6329aa8abb2f425d --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/layer_04-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bd97fc17824779a7580b5b4d1d9edd0cf82c87cdfbb17d7d5ba92130d368f965 +size 113308931 diff --git a/4b284b6bc4seed1/global_step80108/layer_05-model_00-model_states.pt b/4b284b6bc4seed1/global_step80108/layer_05-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e908544e560a65230a32d04bf043892a359855eb --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/layer_05-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d80804c6b0a3d93f8a19235873f314b21a76cc7c7efb8d10b8064d68cfe773b9 +size 113308931 diff --git a/4b284b6bc4seed1/global_step80108/layer_05-model_01-model_states.pt b/4b284b6bc4seed1/global_step80108/layer_05-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..928790344057ad41d272013041708bb8acc87f62 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/layer_05-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b1ee42c249e3019cae2502f99754c28f00e8968a551d8aa9c69019f33c83c989 +size 113308931 diff --git a/4b284b6bc4seed1/global_step80108/layer_06-model_00-model_states.pt b/4b284b6bc4seed1/global_step80108/layer_06-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9c593de000cbfdde594f67f27a5b02df513f3094 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/layer_06-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:65df4e9aae0c8a51378a893f389d3f170d16c14543fcb0d3b812afc14bcfd383 +size 113308931 diff --git a/4b284b6bc4seed1/global_step80108/layer_06-model_01-model_states.pt b/4b284b6bc4seed1/global_step80108/layer_06-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bdf6bba1740e94b7b7f062f5c10c8303d1d63ee0 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/layer_06-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ce8ed8d8d590381fa0170d658992a6f9fc98f6738f72918822584cc50544a93d +size 113308931 diff --git a/4b284b6bc4seed1/global_step80108/layer_07-model_00-model_states.pt b/4b284b6bc4seed1/global_step80108/layer_07-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..317fd40a0136417f6c8bd708ee98d3ed50cb1835 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/layer_07-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:337a715ea5ab2b725cdb7718acb7e877337bf6069378b9d9562ce823a49354a3 +size 113308931 diff --git a/4b284b6bc4seed1/global_step80108/layer_07-model_01-model_states.pt b/4b284b6bc4seed1/global_step80108/layer_07-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a70bb79782581d381e55f8b005ef228119fa6e7a --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/layer_07-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4de2a0cfb67981df7abb767eaee6e6483b956926d9a8c693ad57da6b202fad86 +size 113308931 diff --git a/4b284b6bc4seed1/global_step80108/layer_08-model_00-model_states.pt b/4b284b6bc4seed1/global_step80108/layer_08-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fa6c778e3ccbe1708a5ad4188cff216c5d7fa625 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/layer_08-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f6f13bcffa3e89017886a5e99e79600655c5f36ec1f397a26bd78fc17d7c42e0 +size 113308931 diff --git a/4b284b6bc4seed1/global_step80108/layer_08-model_01-model_states.pt b/4b284b6bc4seed1/global_step80108/layer_08-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..45164f8184ce1899880ad9c5bd6734bc4413041d --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/layer_08-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:82bd42f23e15be40c46143b666315f334f7aa014a34c56294652d0343ca329d0 +size 113308931 diff --git a/4b284b6bc4seed1/global_step80108/layer_09-model_00-model_states.pt b/4b284b6bc4seed1/global_step80108/layer_09-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a3df02a83cd9ac872bb9a1d1ce3d3d15f22e50ca --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/layer_09-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:839ec97e6b79db87444178a0b9ff1e4847f91716d5ed7cf2954f035fc5c3e405 +size 113308931 diff --git a/4b284b6bc4seed1/global_step80108/layer_09-model_01-model_states.pt b/4b284b6bc4seed1/global_step80108/layer_09-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..244fb9dfae84d3aba5d3f52e43c5cc26791c85b8 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/layer_09-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b09b4fb1fc3e9555066dbd351902015493c8c707b513c5008d4eae46b2247b5f +size 113308931 diff --git a/4b284b6bc4seed1/global_step80108/layer_10-model_00-model_states.pt b/4b284b6bc4seed1/global_step80108/layer_10-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5517c9686a57be7cbdfb2c3ad75ac5ee0eb684db --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/layer_10-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:43718e9c44ed78e413d107cf1ab85f290c6b1ddf7bf51e17be9f33c61f990054 +size 113308931 diff --git a/4b284b6bc4seed1/global_step80108/layer_10-model_01-model_states.pt b/4b284b6bc4seed1/global_step80108/layer_10-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fb87962d9f9ffa1a3bfc71692672137f329f96f7 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/layer_10-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7373bc762d3b9d727d1f5484010c4dad60932859c9fb879fd077d6cfdaec280d +size 113308931 diff --git a/4b284b6bc4seed1/global_step80108/layer_11-model_00-model_states.pt b/4b284b6bc4seed1/global_step80108/layer_11-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5a6c75fa2e098b4f3ec82cd796e00fa35933e24a --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/layer_11-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:28f6a28bf7c31a7e4a4c5c549b4fe392eaebcf1a498cdd9534ff5e6800230cb4 +size 113308931 diff --git a/4b284b6bc4seed1/global_step80108/layer_11-model_01-model_states.pt b/4b284b6bc4seed1/global_step80108/layer_11-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..59d6ed9d04be10c25620b9e8cf5b7ab91e617b91 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/layer_11-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f7c1f1035a9f0d6509f252280fe52579d89fb33e3ff4cd851b86bd31bd7a7f5f +size 113308931 diff --git a/4b284b6bc4seed1/global_step80108/layer_12-model_00-model_states.pt b/4b284b6bc4seed1/global_step80108/layer_12-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6e150b2a98948f0c9363c1024be137deb5951b72 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/layer_12-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:25e9b0c43f11f1883a7563a97dada09eda9121bde953e2c0aeacf5dd927a7da8 +size 113308931 diff --git a/4b284b6bc4seed1/global_step80108/layer_12-model_01-model_states.pt b/4b284b6bc4seed1/global_step80108/layer_12-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..10f7c0c11b0ce385f50652b9cb719fa410ae1fff --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/layer_12-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:557729cfd73339a9ba75853a6986436c525bb1287cdbb6ed1eec8507ae6b079c +size 113308931 diff --git a/4b284b6bc4seed1/global_step80108/layer_13-model_00-model_states.pt b/4b284b6bc4seed1/global_step80108/layer_13-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0950f096860d0f3cfb3094a1b7fb43e05659a5a1 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/layer_13-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:15b6456a42838165f90c7a62889d3de8a154724fb6ee22a5da76ac0d2f35fc56 +size 113308931 diff --git a/4b284b6bc4seed1/global_step80108/layer_13-model_01-model_states.pt b/4b284b6bc4seed1/global_step80108/layer_13-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..486dea0fd3ecc4e6e16b5f3ee607af36a46c871a --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/layer_13-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2f0ee62dea2a3a72b6567a0e629860a474bed265bca0274eeaed204d9a13a3b1 +size 113308931 diff --git a/4b284b6bc4seed1/global_step80108/layer_14-model_00-model_states.pt b/4b284b6bc4seed1/global_step80108/layer_14-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6c5ff01b31aeaf0dac632cfb095cfd3746575f5e --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/layer_14-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ee3ab3b67fde04a28dee82edf2c790b1378b9ce347970c44460c27aaa7f3c28d +size 113308931 diff --git a/4b284b6bc4seed1/global_step80108/layer_14-model_01-model_states.pt b/4b284b6bc4seed1/global_step80108/layer_14-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e68b17a9c6874a1302d13351dcc0cc83cc7a3a21 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/layer_14-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3de5796af74b809a71b2bf948bda65c66d83047e94f1613d6cc56da023f0b8fb +size 113308931 diff --git a/4b284b6bc4seed1/global_step80108/layer_15-model_00-model_states.pt b/4b284b6bc4seed1/global_step80108/layer_15-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9a3da68fc1d9815d4496cab90ea068434238cbb7 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/layer_15-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:95d30ca410b2b6f985d719b7f2c9958d9c28de2562c41a61d5ad1cedf7d34611 +size 113308931 diff --git a/4b284b6bc4seed1/global_step80108/layer_15-model_01-model_states.pt b/4b284b6bc4seed1/global_step80108/layer_15-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..25f548348b3a7a765195e418755c25d1c3108ac9 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/layer_15-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d25e0e6f0622d63c2829e1fa738e1b1bcc8920813a97238d4d3874e4fdf1108c +size 113308931 diff --git a/4b284b6bc4seed1/global_step80108/layer_16-model_00-model_states.pt b/4b284b6bc4seed1/global_step80108/layer_16-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ed5909c8e0ae22e0107103e91e3bcf1ecd55dbd9 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/layer_16-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1166695d48ba74ead44f17f76fc58d5a1739273561f43cbbbea6cb8bcfcea627 +size 113308931 diff --git a/4b284b6bc4seed1/global_step80108/layer_16-model_01-model_states.pt b/4b284b6bc4seed1/global_step80108/layer_16-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d22e72823c950278b5fdd315cc499176e03b20ad --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/layer_16-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2e756fc9f1bc26b8c73a8fd45f384e603d5c5ef7acc8e6a7b50ec5297a2cc1cf +size 113308931 diff --git a/4b284b6bc4seed1/global_step80108/layer_17-model_00-model_states.pt b/4b284b6bc4seed1/global_step80108/layer_17-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f7c63837ef77069ae114af414f15dd9fac8077b3 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/layer_17-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5760c6d44f95e38f680315c959a24117f2fdf0a27e1215ebf5129660d0b2362d +size 113308931 diff --git a/4b284b6bc4seed1/global_step80108/layer_17-model_01-model_states.pt b/4b284b6bc4seed1/global_step80108/layer_17-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d45bd68299c85749aa494c48393553795850bdc5 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/layer_17-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:91e72359af732074a3b42e1cbf69bb5d0db6634bf2398882d3e713fb02a338c2 +size 113308931 diff --git a/4b284b6bc4seed1/global_step80108/layer_18-model_00-model_states.pt b/4b284b6bc4seed1/global_step80108/layer_18-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f3fcc00b454726af25097b1f3eef358b22013e74 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/layer_18-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:49f2b8a8d413da37d54f3834f7666a0dd3faab3d0aabd3ce3c47c991bc93d5c5 +size 113308931 diff --git a/4b284b6bc4seed1/global_step80108/layer_18-model_01-model_states.pt b/4b284b6bc4seed1/global_step80108/layer_18-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f5ff955f63c2f553963bb211d7bf7c5d42c70a66 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/layer_18-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ab6e100e86709cc0ea8d3a3365a192fad554dafd2d06008ca8504f4cb9356955 +size 113308931 diff --git a/4b284b6bc4seed1/global_step80108/layer_19-model_00-model_states.pt b/4b284b6bc4seed1/global_step80108/layer_19-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b625bfe6e91635b42d586e47a9dffb99e5a09486 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/layer_19-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3012f30f9566001542941764fd89688ff2b6583b225959e040355370862dae08 +size 113308931 diff --git a/4b284b6bc4seed1/global_step80108/layer_19-model_01-model_states.pt b/4b284b6bc4seed1/global_step80108/layer_19-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..01927b4aa6ba89c16fecbfa110886dec32d42032 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/layer_19-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f9d627317671280554761e0814a591ced513516bd49df125328b1c43861a6ab0 +size 113308931 diff --git a/4b284b6bc4seed1/global_step80108/layer_20-model_00-model_states.pt b/4b284b6bc4seed1/global_step80108/layer_20-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5321bded08a5542db1d7a015e43de847cf7b7149 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/layer_20-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b287f0264164351324201d2d136e41bf538b738981586989cae4a1cb3d4c4809 +size 113308931 diff --git a/4b284b6bc4seed1/global_step80108/layer_20-model_01-model_states.pt b/4b284b6bc4seed1/global_step80108/layer_20-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6084f93fa88df34e0140c1dfb1613ef1d61a910e --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/layer_20-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:10e4b5a46a3c1cd6be9011d6f4f811aeeb2b257d312fa947e81fc91465a428ef +size 113308931 diff --git a/4b284b6bc4seed1/global_step80108/layer_21-model_00-model_states.pt b/4b284b6bc4seed1/global_step80108/layer_21-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1a09adceb051c0dd0cedac7769cd4edf3b48b40a --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/layer_21-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c80e21b1240a5e030b12e8349ba362d5f8d31a068036c15b1dafba001e93c3ac +size 113308931 diff --git a/4b284b6bc4seed1/global_step80108/layer_21-model_01-model_states.pt b/4b284b6bc4seed1/global_step80108/layer_21-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e822f2f26c07a024614e59d5dbd73cd9afbfbcb1 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/layer_21-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e6203c0b15a67f2aaf3482b9721606a07f9efb3a66c84dfe0ec99097298d4b67 +size 113308931 diff --git a/4b284b6bc4seed1/global_step80108/layer_22-model_00-model_states.pt b/4b284b6bc4seed1/global_step80108/layer_22-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..43809f08ebac58f4a09e7110dc829f3fbab565b9 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/layer_22-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a61a74a0a343565cee7558898f8c877bdac138f5da02e1aa344c94849a4ca364 +size 113308931 diff --git a/4b284b6bc4seed1/global_step80108/layer_22-model_01-model_states.pt b/4b284b6bc4seed1/global_step80108/layer_22-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f26bfe28df00929c7d62096e6a0f8438cb86a017 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/layer_22-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:be19655cd124b623a37f01f32d7040ab06897b82393f733841b47e86830df1c5 +size 113308931 diff --git a/4b284b6bc4seed1/global_step80108/layer_23-model_00-model_states.pt b/4b284b6bc4seed1/global_step80108/layer_23-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4e5fc232013c9e55e6da939a3fce9573d8f291d6 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/layer_23-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f70992fa47f70ddf8e872ed7566733369b3efc213cdec2472389af91f25118f7 +size 113308931 diff --git a/4b284b6bc4seed1/global_step80108/layer_23-model_01-model_states.pt b/4b284b6bc4seed1/global_step80108/layer_23-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2b350d2a408ad8819f843f04b5f6a6580be42e5c --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/layer_23-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e727770b3ed61de37118cb6710664da5c273855dd6c352add1c9406d11b2476 +size 113308931 diff --git a/4b284b6bc4seed1/global_step80108/layer_24-model_00-model_states.pt b/4b284b6bc4seed1/global_step80108/layer_24-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e07df0629746749e20c2934ad83f35a4c45fbea5 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/layer_24-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f56e444ff1c13785055e3cfd30fa97ce31cbccd0174378838218793f098d0d9 +size 113308931 diff --git a/4b284b6bc4seed1/global_step80108/layer_24-model_01-model_states.pt b/4b284b6bc4seed1/global_step80108/layer_24-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..78b66994140b2da21ca54e8f21908815a1a8185f --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/layer_24-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:39466db7cbd5791d5b6c8e7a09b0a5ed2f57726e99c803bbbfc5e8baffb18499 +size 113308931 diff --git a/4b284b6bc4seed1/global_step80108/layer_25-model_00-model_states.pt b/4b284b6bc4seed1/global_step80108/layer_25-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cc9732573e42d0e7362f7a1b1e7d094c7256db45 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/layer_25-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3c904638fa78632b9f940760cd278d7e40edff9b25026da9182c8e114f14c100 +size 113308931 diff --git a/4b284b6bc4seed1/global_step80108/layer_25-model_01-model_states.pt b/4b284b6bc4seed1/global_step80108/layer_25-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6964b2cba43c66394234c9970ddde9a580e611e1 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/layer_25-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1342b07ddcc2387a37d36de3767c29b723a80cfe24af75caaee013a1f1f64912 +size 113308931 diff --git a/4b284b6bc4seed1/global_step80108/layer_26-model_00-model_states.pt b/4b284b6bc4seed1/global_step80108/layer_26-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c56f3ff0d8f4e93b4a4e44dffcc6fdbfd1896ff5 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/layer_26-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0129cb7efd40464e66a912305267826fd24758b76fff5895a717ace5df74fa25 +size 113308931 diff --git a/4b284b6bc4seed1/global_step80108/layer_26-model_01-model_states.pt b/4b284b6bc4seed1/global_step80108/layer_26-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..387b2481c547bbfd6290d60a2bfd715f16745b90 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/layer_26-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ff55739b8d5fee23a111e0120dbe9f00271dcbaa1e5f28b4a36de64405970161 +size 113308931 diff --git a/4b284b6bc4seed1/global_step80108/layer_27-model_00-model_states.pt b/4b284b6bc4seed1/global_step80108/layer_27-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ea8827e035c4e1fe5c91a035ec4ce038e027ba25 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/layer_27-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:94032f3b3d275ec02b4593d9d9085ca20975e4d5fe590b645514226fa4e5c159 +size 113308931 diff --git a/4b284b6bc4seed1/global_step80108/layer_27-model_01-model_states.pt b/4b284b6bc4seed1/global_step80108/layer_27-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1c598e97d967a10bbf09739a33999d03fa05b0e4 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/layer_27-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e70452a8529ed0f18e8859fce055c38a2b881c9b3a9d57e0dbf7d2165062f079 +size 113308931 diff --git a/4b284b6bc4seed1/global_step80108/layer_28-model_00-model_states.pt b/4b284b6bc4seed1/global_step80108/layer_28-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3c8aad35fe5534926dd45b88d321f5410f5a4fff --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/layer_28-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:350dfda9df48428cce6ab799a58566883756bc4ce96d0869a9eb84e6236b956b +size 113308931 diff --git a/4b284b6bc4seed1/global_step80108/layer_28-model_01-model_states.pt b/4b284b6bc4seed1/global_step80108/layer_28-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..08d73f5b85118018759ac56bfbf884a7ab25b810 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/layer_28-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:529a2aca3884f7734b74ae811b9ab42a515bced41023bc3a4258b9b4394d4c7f +size 113308931 diff --git a/4b284b6bc4seed1/global_step80108/layer_29-model_00-model_states.pt b/4b284b6bc4seed1/global_step80108/layer_29-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7b7e605981cb898d19238cc1e6e8c8113cf32c66 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/layer_29-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:de5a0152708493a16f4261e17465f6bdeae745e0c887a78588ab831f2442d188 +size 113308931 diff --git a/4b284b6bc4seed1/global_step80108/layer_29-model_01-model_states.pt b/4b284b6bc4seed1/global_step80108/layer_29-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..664be8284650cb6b3e62576a5233a31d20f1eee1 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/layer_29-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c4ecaa610463fff90976667129c3e8d1c5f9da72baf592b95d937dd7f512a28 +size 113308931 diff --git a/4b284b6bc4seed1/global_step80108/layer_30-model_00-model_states.pt b/4b284b6bc4seed1/global_step80108/layer_30-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4688b6ea45b0e0fecf41c2ab3f1050545a0c3b4a --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/layer_30-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:37cae25067f72d8aa8d64623a979fda72545c8fb98ea530ac2374c0afb95f2f2 +size 113308931 diff --git a/4b284b6bc4seed1/global_step80108/layer_30-model_01-model_states.pt b/4b284b6bc4seed1/global_step80108/layer_30-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c28471d1525fbe3a53beb5721b5d4744c3b3cca2 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/layer_30-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b837a29c5f401822ca125884d72203feafc8243d2cdd84c87a52e995506f3e78 +size 113308931 diff --git a/4b284b6bc4seed1/global_step80108/layer_31-model_00-model_states.pt b/4b284b6bc4seed1/global_step80108/layer_31-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..925eec89caf4f31a4c98d3ac7ba1544c32bba7f5 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/layer_31-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:398419471720bffa37cc843d88b7a437d654fc206f790a865ec313dbd896b5d9 +size 113308931 diff --git a/4b284b6bc4seed1/global_step80108/layer_31-model_01-model_states.pt b/4b284b6bc4seed1/global_step80108/layer_31-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f1c061521018a0d6ef00b2704f30f349c634c2e6 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/layer_31-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d849dcd5b768b111400e112e3c919c8f29d8e3050bec4161e5101ec99b04fd42 +size 113308931 diff --git a/4b284b6bc4seed1/global_step80108/layer_32-model_00-model_states.pt b/4b284b6bc4seed1/global_step80108/layer_32-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b2eb9f295ec9d06333cf05201501f3617aea51b8 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/layer_32-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dbcb27421c1cc72a42c9c85e04232f397059659ec29e3110c2eb9cc64f342193 +size 113308931 diff --git a/4b284b6bc4seed1/global_step80108/layer_32-model_01-model_states.pt b/4b284b6bc4seed1/global_step80108/layer_32-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..60dd16898434f1d6907fc37487883e7dec36cf71 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/layer_32-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e73b789f2354af302ae732e223f3969c1fdf7c57d57a0092d42dad8ffe7bfc73 +size 113308931 diff --git a/4b284b6bc4seed1/global_step80108/layer_33-model_00-model_states.pt b/4b284b6bc4seed1/global_step80108/layer_33-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..03e74034290e831d1e29095e7b9fa9e3e06b0bda --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/layer_33-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:78b28f357e10389f7ba232cc592cb20830cd379f1c7287c9fceb8105b23138df +size 113308931 diff --git a/4b284b6bc4seed1/global_step80108/layer_33-model_01-model_states.pt b/4b284b6bc4seed1/global_step80108/layer_33-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..de249c7c27fae8415fa6a10ef4b42cd9252cb572 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/layer_33-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:68248cfeaf2b1532caf1fe0213da39fb1fcef11085c1a98732954ce266f1bd41 +size 113308931 diff --git a/4b284b6bc4seed1/global_step80108/layer_34-model_00-model_states.pt b/4b284b6bc4seed1/global_step80108/layer_34-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b07c97bddd587173f29a598dba5626fb28579dc7 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/layer_34-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5c19f43154d3bfafde204e3f5f514e64ecb13ee232d041a9c9655e3904388cb2 +size 113308931 diff --git a/4b284b6bc4seed1/global_step80108/layer_34-model_01-model_states.pt b/4b284b6bc4seed1/global_step80108/layer_34-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f5d836a13ed00de9507f0c19895e80d8cf034fa0 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/layer_34-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:434ce0e0d0f1fa0e1449b88eb4e1a73581a63420e503769ba4264d26e34768e6 +size 113308931 diff --git a/4b284b6bc4seed1/global_step80108/layer_35-model_00-model_states.pt b/4b284b6bc4seed1/global_step80108/layer_35-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cf1cdacf8afeecdb05b8d44d2dd7e293ebc60771 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/layer_35-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:68e342ca7203f89ef5b0a8fbc65f01dfed91fdf3d788109f28260409be5c1840 +size 113308931 diff --git a/4b284b6bc4seed1/global_step80108/layer_35-model_01-model_states.pt b/4b284b6bc4seed1/global_step80108/layer_35-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..47c8b9ee33ff2e46daa0b725441259c004a92fa3 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/layer_35-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:663d0af021c4063848481be477cead357421e996c7322070c0977f0675c57335 +size 113308931 diff --git a/4b284b6bc4seed1/global_step80108/layer_36-model_00-model_states.pt b/4b284b6bc4seed1/global_step80108/layer_36-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..725f6dca704a1a4d6b6485214e980966ed644c1c --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/layer_36-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f1ee2b5c3965da1edd1da9796c7111df47e9808511a45094ebb48152901992f +size 113308931 diff --git a/4b284b6bc4seed1/global_step80108/layer_36-model_01-model_states.pt b/4b284b6bc4seed1/global_step80108/layer_36-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bf3bbde57a7d4827cc4fa1274f609b7283b6abf9 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/layer_36-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e2c30c8e1965cc97b2498793fff2792c2c55ad7bba573dd41611093d961728a +size 113308931 diff --git a/4b284b6bc4seed1/global_step80108/layer_37-model_00-model_states.pt b/4b284b6bc4seed1/global_step80108/layer_37-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e23643484f5fa2601e7a15e8ed851f42880367e --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/layer_37-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:362f2e902cba5c8ae7b40b0c0df2aa617683c29020ec32d768431c7eda011ddf +size 113308931 diff --git a/4b284b6bc4seed1/global_step80108/layer_37-model_01-model_states.pt b/4b284b6bc4seed1/global_step80108/layer_37-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4c62b7b06cd5d51e5bbfeeea8fa78b722ebb735d --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/layer_37-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b5a3bb443812686fdd630daf78176765b068febb7fc76385c3f813f28a0c5a36 +size 113308931 diff --git a/4b284b6bc4seed1/global_step80108/layer_38-model_00-model_states.pt b/4b284b6bc4seed1/global_step80108/layer_38-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7bdf37148cd8d0b72be8e036261101171574d516 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/layer_38-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2c2e3db5b69d39f585947d8b55a185ba0d7fe88465f78a374a27442df5a0e55a +size 113308931 diff --git a/4b284b6bc4seed1/global_step80108/layer_38-model_01-model_states.pt b/4b284b6bc4seed1/global_step80108/layer_38-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..663e9b82ca34afbfed83b9e4eb93cec2c7c882de --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/layer_38-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:77a125a1a5a2d3647c36486ff01eb9ff88bbc17d858023d74d860af067f1d807 +size 113308931 diff --git a/4b284b6bc4seed1/global_step80108/layer_40-model_00-model_states.pt b/4b284b6bc4seed1/global_step80108/layer_40-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0c3ba31f17e833a8ee5fed5d230e7a29e9901e28 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/layer_40-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:238e1b2e0e460f86f86669754b2ec5642dbcaba2cfbfbadd44265080834c0de0 +size 13507 diff --git a/4b284b6bc4seed1/global_step80108/layer_40-model_01-model_states.pt b/4b284b6bc4seed1/global_step80108/layer_40-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3d19badba21cf9a350d5e3a5fc03fe00561d8770 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/layer_40-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6d416715982116a399ff1f4300ec9e45048be8351b99178a3606bbd3ea29c132 +size 13507 diff --git a/4b284b6bc4seed1/global_step80108/mp_rank_00_model_states.pt b/4b284b6bc4seed1/global_step80108/mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..627351e580e58e287821afe8bbc63e2bc3ba0d87 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6e0dc925e735904ea4ed3ab298d4cc378c32781adc091606df1e01ef812e59bd +size 51507 diff --git a/4b284b6bc4seed1/global_step80108/mp_rank_01_model_states.pt b/4b284b6bc4seed1/global_step80108/mp_rank_01_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..497d17da0c75c03f76bfd58f034aa4d3cc2e9a45 --- /dev/null +++ b/4b284b6bc4seed1/global_step80108/mp_rank_01_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d3629d9f650dff60248f423528e32d5f879f7440e25dd0bc9cc5ef1dcaae4258 +size 51507 diff --git a/4b284b6bc4seed1/transformers/config.json b/4b284b6bc4seed1/transformers/config.json new file mode 100644 index 0000000000000000000000000000000000000000..df814c3a71ee49044410636b5eeb4f43611690ba --- /dev/null +++ b/4b284b6bc4seed1/transformers/config.json @@ -0,0 +1 @@ +{"vocab_size": 50432, "n_positions": 2048, "n_embd": 3072, "n_layer": 36, "n_head": 24, "n_inner": 12288, "activation_function": "gelu", "resid_pdrop": 0.1, "embd_pdrop": 0.1, "attn_pdrop": 0.1, "layer_norm_epsilon": 1e-05, "initializer_range": 0.02, "summary_type": "cls_index", "summary_use_proj": true, "summary_activation": null, "summary_first_dropout": 0.1, "summary_proj_to_labels": true, "scale_attn_weights": true, "use_cache": true, "scale_attn_by_inverse_layer_idx": false, "reorder_and_upcast_attn": false, "bos_token_id": 50256, "eos_token_id": 50256, "return_dict": true, "output_hidden_states": false, "output_attentions": false, "torchscript": false, "torch_dtype": null, "use_bfloat16": false, "tf_legacy_loss": false, "pruned_heads": {}, "tie_word_embeddings": true, "is_encoder_decoder": false, "is_decoder": false, "cross_attention_hidden_size": null, "add_cross_attention": false, "tie_encoder_decoder": false, "max_length": 20, "min_length": 0, "do_sample": false, "early_stopping": false, "num_beams": 1, "num_beam_groups": 1, "diversity_penalty": 0.0, "temperature": 1.0, "top_k": 50, "top_p": 1.0, "typical_p": 1.0, "repetition_penalty": 1.0, "length_penalty": 1.0, "no_repeat_ngram_size": 0, "encoder_no_repeat_ngram_size": 0, "bad_words_ids": null, "num_return_sequences": 1, "chunk_size_feed_forward": 0, "output_scores": false, "return_dict_in_generate": false, "forced_bos_token_id": null, "forced_eos_token_id": null, "remove_invalid_values": false, "exponential_decay_length_penalty": null, "suppress_tokens": null, "begin_suppress_tokens": null, "architectures": ["GPT2LMHeadModel"], "finetuning_task": null, "id2label": {"0": "LABEL_0", "1": "LABEL_1"}, "label2id": {"LABEL_0": 0, "LABEL_1": 1}, "tokenizer_class": null, "prefix": null, "pad_token_id": null, "sep_token_id": null, "decoder_start_token_id": null, "task_specific_params": null, "problem_type": null, "_name_or_path": "", "transformers_version": "4.25.0.dev0", "n_ctx": 1024, "gradient_checkpointing": false, "model_type": "gpt2"} \ No newline at end of file diff --git a/4b284b6bc4seed1/transformers/pytorch_model.bin b/4b284b6bc4seed1/transformers/pytorch_model.bin new file mode 100644 index 0000000000000000000000000000000000000000..52df0bf245c320293d1e6fe8c754b3630e7bb064 --- /dev/null +++ b/4b284b6bc4seed1/transformers/pytorch_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0f10ae1134d88b43641fd2f491289a8af85dd7e622af7f37adc3d6b5b2d5c43b +size 8781203669 diff --git a/4b284b6bc4seed2/evaluation/generation/agg.4b284b6bc4seed2_GEM-web_nlg_en_PALM_prompt_0.json b/4b284b6bc4seed2/evaluation/generation/agg.4b284b6bc4seed2_GEM-web_nlg_en_PALM_prompt_0.json new file mode 100644 index 0000000000000000000000000000000000000000..af0c716d18ef09f8b69355668e17b367c316a5e6 --- /dev/null +++ b/4b284b6bc4seed2/evaluation/generation/agg.4b284b6bc4seed2_GEM-web_nlg_en_PALM_prompt_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.4505969912144358, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.043025981663977676}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.07715680688754782, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0018501494099723034}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.32800192332635164, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004716290361046614}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.11475949399291512, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0020930584454703313}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.03691606942766564, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.001226252004533247}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.15714130080850514, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.003275285581951961}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.05421096419841178, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0013323602620276317}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.07330043188559601, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0016882205517441595}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.31747468696171116, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004607770796206798}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.1095828810892153, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0019205919592418358}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.07264308016772093, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.001734436368694926}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.30915040739896027, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004387887182362267}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.10804953744361874, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0019462325362491339}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b6bc4seed2/evaluation/generation/agg.4b284b6bc4seed2_GEM-web_nlg_en_PALM_prompt_1.json b/4b284b6bc4seed2/evaluation/generation/agg.4b284b6bc4seed2_GEM-web_nlg_en_PALM_prompt_1.json new file mode 100644 index 0000000000000000000000000000000000000000..336255de77ef604a0c826c844e871f0eda55914e --- /dev/null +++ b/4b284b6bc4seed2/evaluation/generation/agg.4b284b6bc4seed2_GEM-web_nlg_en_PALM_prompt_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.5248973715012223, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.04500340113008066}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.0790761668773179, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0016843496475256363}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.3697333749180133, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.005009866939283317}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.12116080004166574, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002034248506156313}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.03678510490686299, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.001081873045114326}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.17843660776062029, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.003489215109878396}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.05647199175457009, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0013066532545353317}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.07404916365054973, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0015255606390290489}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.34923402691643046, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004687346760287558}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.11376961245179681, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0018264898168477456}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.07445381060380506, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.001593181333906948}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.3467160374634341, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004579407380382054}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.11395978695320426, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0018994693226140945}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b6bc4seed2/evaluation/generation/agg.4b284b6bc4seed2_GEM-web_nlg_en_PALM_prompt_2.json b/4b284b6bc4seed2/evaluation/generation/agg.4b284b6bc4seed2_GEM-web_nlg_en_PALM_prompt_2.json new file mode 100644 index 0000000000000000000000000000000000000000..115480a41ec6f2538782fd5b96784c3f807e8e33 --- /dev/null +++ b/4b284b6bc4seed2/evaluation/generation/agg.4b284b6bc4seed2_GEM-web_nlg_en_PALM_prompt_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.5767647931281593, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.03075444324731624}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.08030107100423996, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0015674832760453747}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.38840421585850693, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.005175482568072094}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.12441199271565954, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.001979354566482751}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.037112804584329, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0009141020328534724}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.19070965082945687, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.003653414412934534}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.057979391263589294, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0012537328703996166}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.07384535953637529, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0013915854560762077}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.3595423504669609, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.00473567632900781}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.11464846086222981, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0017509905495136865}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.07564699950143948, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0014680313985962644}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.3655854110990312, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0047861725768252785}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.11714224514649191, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0018352989430204284}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b6bc4seed2/evaluation/generation/agg.4b284b6bc4seed2_GEM-web_nlg_en_PALM_prompt_3.json b/4b284b6bc4seed2/evaluation/generation/agg.4b284b6bc4seed2_GEM-web_nlg_en_PALM_prompt_3.json new file mode 100644 index 0000000000000000000000000000000000000000..f3dac7e8e7ef24140e0730b00d7181051ccb8516 --- /dev/null +++ b/4b284b6bc4seed2/evaluation/generation/agg.4b284b6bc4seed2_GEM-web_nlg_en_PALM_prompt_3.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.6551242086874565, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.03786184470041364}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.07882570317453028, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0015398380099203338}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.39347312457818545, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.005115592107070138}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.12253462963491722, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0019458379147742845}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.0365856093502546, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0009020386358581405}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.19448869036942362, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0036911175236007915}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.05738575356669148, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0012433710684840093}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.07184479663593357, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0013555990593936752}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.36011891059508755, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004569680331874904}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.11178706827138284, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0016888026831589167}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.07401320225138429, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.001446688093860126}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.3682561684373326, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004661037301261206}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.11492232075242285, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0018044818590991203}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 3, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b6bc4seed2/evaluation/generation/agg.4b284b6bc4seed2_GEM-web_nlg_en_PALM_prompt_4.json b/4b284b6bc4seed2/evaluation/generation/agg.4b284b6bc4seed2_GEM-web_nlg_en_PALM_prompt_4.json new file mode 100644 index 0000000000000000000000000000000000000000..d344fad82fe7379df7fcf0100b4be97a2fa2056c --- /dev/null +++ b/4b284b6bc4seed2/evaluation/generation/agg.4b284b6bc4seed2_GEM-web_nlg_en_PALM_prompt_4.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.6361569019073665, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.048795806087287424}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.07936192579865504, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0015426897773666887}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.3967228621080476, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.005035788052603314}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.12333237651607433, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0018995495239739787}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.0361795830053176, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0008771942709925916}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.19495589680109515, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0036179457975666733}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.05685164611012959, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.001193840199959299}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.07239948675670523, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0013748540153599564}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.3637724702147103, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004528167648238907}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.11262522353373274, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.001668123718914031}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.07461562643114039, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0014456314194904961}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.3734381336992152, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004658729212112421}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.11594403375103957, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0017604845749238877}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 4, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b6bc4seed2/evaluation/generation/agg.4b284b6bc4seed2_GEM-web_nlg_en_PALM_prompt_5.json b/4b284b6bc4seed2/evaluation/generation/agg.4b284b6bc4seed2_GEM-web_nlg_en_PALM_prompt_5.json new file mode 100644 index 0000000000000000000000000000000000000000..8c8cee76ce8034aca56a75543a5f08dd417428b5 --- /dev/null +++ b/4b284b6bc4seed2/evaluation/generation/agg.4b284b6bc4seed2_GEM-web_nlg_en_PALM_prompt_5.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.6348116381689767, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.025032005928245744}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.07772480241459157, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0014761937289481531}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.39775384294624816, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.005043126900140792}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.12151531670936837, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0018013952412054407}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.03642686374060602, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0010535500618274554}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.1954871545530622, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0036330438060616513}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.05654046753025775, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0011574259112533843}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.0708062283164349, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0013339231845929654}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.3620745179558994, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.00449776594486043}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.1106233752219019, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0016037607255517253}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.07304451504316123, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0013879168010522463}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.37251915128720225, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.00464816980850311}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.1140750876332385, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0016853800565220047}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 5, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b6bc4seed2/evaluation/generation/agg.4b284b6bc4seed2_GEM-wiki_lingua_en_tldr_en_0.json b/4b284b6bc4seed2/evaluation/generation/agg.4b284b6bc4seed2_GEM-wiki_lingua_en_tldr_en_0.json new file mode 100644 index 0000000000000000000000000000000000000000..a996e812e6540ee08291268ee9c5f9a75753bbf7 --- /dev/null +++ b/4b284b6bc4seed2/evaluation/generation/agg.4b284b6bc4seed2_GEM-wiki_lingua_en_tldr_en_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.1603204965143781, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0019055374186705493}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.273148053641277, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.00271429826551829}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.18760609214914972, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0018528010283896678}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.03352653833860025, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0008141842668329252}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.059532665192850664, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.001495886372304702}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.039553536857052096, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0009080316883759782}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.11956609361350197, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.001288770553600895}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.21092821240171705, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002145023872994803}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.14148134446020433, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.001278578656113803}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.1475742184322245, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.001744563798127783}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.25286325424170925, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0025434557707113424}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.17295948170907235, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0016989010001995553}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 1.7934141534025163, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.08383146848244837}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b6bc4seed2/evaluation/generation/agg.4b284b6bc4seed2_GEM-wiki_lingua_en_tldr_en_1.json b/4b284b6bc4seed2/evaluation/generation/agg.4b284b6bc4seed2_GEM-wiki_lingua_en_tldr_en_1.json new file mode 100644 index 0000000000000000000000000000000000000000..1e34e184237824835ce2ba4c6b3ba8ae61092283 --- /dev/null +++ b/4b284b6bc4seed2/evaluation/generation/agg.4b284b6bc4seed2_GEM-wiki_lingua_en_tldr_en_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.1745195547370322, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0020211127459286177}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.29756863851182014, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.002720442694533944}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.20404111705603262, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0018961046573895371}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.038836287518126324, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0008918673703720118}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.0678582672753382, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0015726696869910164}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.04531387019112246, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0009454489412507513}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.12403344533976053, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0013370363902071867}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.21966745113211172, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002148471848315497}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.14662233559425056, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0012675330724451579}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.16262281802775871, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0018832504839498365}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.2785759841913255, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.002586017885803777}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.19031232879553658, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0017631603815569407}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 2.2027676863872756, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.07884539943019493}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b6bc4seed2/evaluation/generation/agg.4b284b6bc4seed2_GEM-wiki_lingua_en_tldr_en_2.json b/4b284b6bc4seed2/evaluation/generation/agg.4b284b6bc4seed2_GEM-wiki_lingua_en_tldr_en_2.json new file mode 100644 index 0000000000000000000000000000000000000000..8b66a709837cab13fd70b89fd43cd856a7c30610 --- /dev/null +++ b/4b284b6bc4seed2/evaluation/generation/agg.4b284b6bc4seed2_GEM-wiki_lingua_en_tldr_en_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.17812583517946007, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.002009945937748485}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.303539848216664, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.002638500102412918}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.2078510077674295, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0018302477945332431}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.03988619638649071, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0008528640674491505}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.07069101771037783, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0015418058212234357}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.04667487755408923, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0009128949090939083}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.1260062676909843, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.001364424629646694}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.22269555369572, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002089758754681962}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.14847289603046035, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0012287208530959888}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.16673210140327593, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.001876553104110706}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.28573976969483017, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.002520262824141778}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.1948747340586584, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0017076787007878865}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 2.3891366560914298, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.08062856329183088}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b6bc4seed2/evaluation/generation/agg.4b284b6bc4seed2_GEM-wiki_lingua_en_tldr_en_3.json b/4b284b6bc4seed2/evaluation/generation/agg.4b284b6bc4seed2_GEM-wiki_lingua_en_tldr_en_3.json new file mode 100644 index 0000000000000000000000000000000000000000..e0b73360a879072382c6f1c42138a18f866ed349 --- /dev/null +++ b/4b284b6bc4seed2/evaluation/generation/agg.4b284b6bc4seed2_GEM-wiki_lingua_en_tldr_en_3.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.15466504916141774, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.002308226402178308}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.2551520537583065, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0032171951632609264}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.17428261104968168, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0021443814628730523}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.03492860218651495, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0009155361590863039}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.060501291725340245, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.001568003123293494}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.03952258753236028, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0009033133825001278}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.11061065008297513, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0016789233374586393}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.1885220916112058, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002535325446834288}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.12499242197529943, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0014791492005730253}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.1453452296219742, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0021599240195076573}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.24088194688429895, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.00305926261571982}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.16396063897113883, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0020097929828463102}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 2.38911546645986, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.07647894828583013}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 3, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b6bc4seed2/evaluation/generation/agg.4b284b6bc4seed2_GEM-wiki_lingua_en_tldr_en_4.json b/4b284b6bc4seed2/evaluation/generation/agg.4b284b6bc4seed2_GEM-wiki_lingua_en_tldr_en_4.json new file mode 100644 index 0000000000000000000000000000000000000000..9da903e42cf76f7eb41171c44f36ef91ed8457c6 --- /dev/null +++ b/4b284b6bc4seed2/evaluation/generation/agg.4b284b6bc4seed2_GEM-wiki_lingua_en_tldr_en_4.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.053018296777332476, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.001989950046503427}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.08596667050742965, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.002947649719879261}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.056665547293806504, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.001891719846577204}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.011358703706930581, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.000600320864289757}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.021640340405918963, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0011802802866629615}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.013047921347416528, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0006398386351669672}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.03957496787938521, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0015124056846112217}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.06552651052204829, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0022922651246891222}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.04210570382315936, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.001378676251875729}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.049771628442206735, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0018700031303863793}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.08106940347167176, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0027897599646264986}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.05326532550449904, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0017732306920814024}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 0.5396555354382301, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.03382350846346006}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 4, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b6bc4seed2/evaluation/generation/agg.4b284b6bc4seed2_GEM-wiki_lingua_en_tldr_en_5.json b/4b284b6bc4seed2/evaluation/generation/agg.4b284b6bc4seed2_GEM-wiki_lingua_en_tldr_en_5.json new file mode 100644 index 0000000000000000000000000000000000000000..7dc8dca5bcd4d20222c631938cf7af926f45830a --- /dev/null +++ b/4b284b6bc4seed2/evaluation/generation/agg.4b284b6bc4seed2_GEM-wiki_lingua_en_tldr_en_5.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.008477708430630778, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0008888303927431226}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.013378525794197375, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0013202915810629089}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.008692457481160468, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0008227750799750827}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.002035592041182627, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0003440486575723203}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.003334615800958582, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0004964329628462136}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.0020021672595433877, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0002655938544483011}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.006368490138883737, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0006824241585392732}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.010162399165178543, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0010265436936400937}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.006455452264291404, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0006047126016011451}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.007948184602390525, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0008399495471791939}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.012575544635440476, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0012445710338658724}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.008133155428782728, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0007677758628473678}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 6.626695028697088e-07, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 1.1951854876786307e-06}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 5, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b6bc4seed2/evaluation/generation/agg.4b284b6bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_0.json b/4b284b6bc4seed2/evaluation/generation/agg.4b284b6bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_0.json new file mode 100644 index 0000000000000000000000000000000000000000..ee3b037f9c1c6ab58079b0509da9290459349bd2 --- /dev/null +++ b/4b284b6bc4seed2/evaluation/generation/agg.4b284b6bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 2.878712808592603, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.0853866064382545}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.12473936122211624, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.001798387415150618}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.21205919428582165, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.002854707525591281}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.14598569647435716, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0019257642313717281}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.03495666955822184, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0008687034534547671}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.06654649371061956, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0016084812198622184}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.04387542635560367, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0010442399588521244}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.11526993035626307, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.001545375812569594}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.19660657514045912, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0025255577441268087}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.13483368037365023, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0016578290285278543}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.10944292922104659, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0015541855309834716}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.1856831740193031, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0025479048755850213}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.12774057149590898, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0016934965354593117}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b6bc4seed2/evaluation/generation/agg.4b284b6bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_1.json b/4b284b6bc4seed2/evaluation/generation/agg.4b284b6bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_1.json new file mode 100644 index 0000000000000000000000000000000000000000..fd99988ed35a3430941cd29e645e9076f6e84c12 --- /dev/null +++ b/4b284b6bc4seed2/evaluation/generation/agg.4b284b6bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 9.756713461785154, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.1556457646527884}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.4098430493296336, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.002322243350403215}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.44204106174129115, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.002648076916437811}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.40687267868315097, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0018487565527517862}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.17194753805951837, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0017305953745273977}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.18647781584399134, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0018885402575458418}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.17029119687013236, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0015443604787036918}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.28268352481109116, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0019277807551157933}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.30476888259625023, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0021362292770155254}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.28000012009488995, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0015606595580042648}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.33736408060377443, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.002189042828443897}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.3634133186767332, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0024561816405961946}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.3345777715915075, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.001819480989061025}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b6bc4seed2/evaluation/generation/agg.4b284b6bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_2.json b/4b284b6bc4seed2/evaluation/generation/agg.4b284b6bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_2.json new file mode 100644 index 0000000000000000000000000000000000000000..e3c684eaba5a081ad07fecf87d058bfdf9ec910d --- /dev/null +++ b/4b284b6bc4seed2/evaluation/generation/agg.4b284b6bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 9.703365784320074, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.16108986784891388}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.392092480268303, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.002302537065374289}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.4700929192938433, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0025952785236860797}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.4101176075687606, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0018267883175402378}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.17385266696101637, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0016739605455478718}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.21043725627335938, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0019419833439951327}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.1817582009151592, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.001527895144436596}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.2694278866213945, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0018257757886672125}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.32463760826780586, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0021411692643784116}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.2819491223195203, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0015219411814398627}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.32676135279841206, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.002119047445904341}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.3923976496945184, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.002451591838805565}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.341970457946986, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0017909707229488067}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b6bc4seed2/evaluation/generation/agg.4b284b6bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_3.json b/4b284b6bc4seed2/evaluation/generation/agg.4b284b6bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_3.json new file mode 100644 index 0000000000000000000000000000000000000000..cd4b6a724272965727fe327a4eaf156828429047 --- /dev/null +++ b/4b284b6bc4seed2/evaluation/generation/agg.4b284b6bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_3.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 9.761234651073966, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.08117964062807032}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.3769467510554381, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.00213141802058671}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.4783045642626352, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0025707591897062483}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.4065423629912447, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.001806841436683923}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.16918099441968293, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0015053602189487548}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.21947419317279818, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.002013053097487535}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.18366190818796568, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0015116466616384265}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.2607744983983079, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0016830752871787188}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.3333300743221725, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0021979974365264774}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.2817551356956864, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0015262712862237756}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.31727007213590536, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.001993439598512182}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.40307149877627624, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.002469750781351579}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.34229547153938067, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.001786413003034628}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 3, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b6bc4seed2/evaluation/generation/agg.4b284b6bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_4.json b/4b284b6bc4seed2/evaluation/generation/agg.4b284b6bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_4.json new file mode 100644 index 0000000000000000000000000000000000000000..74f9f25d4acfdb0087040c4305cfcd9849a42950 --- /dev/null +++ b/4b284b6bc4seed2/evaluation/generation/agg.4b284b6bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_4.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 10.060481335729593, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.13006673690205298}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.3804171250877555, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0021190302719114127}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.4780703069260566, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.002533824939435917}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.40925099639651336, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0018052362806663203}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.17221168629234665, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0015253603947935756}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.2208989636456487, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0020171225023131564}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.1863731784770829, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0015333517641007584}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.26364753406030395, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.001681924883574724}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.3339558499615528, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0022103390891101316}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.28431779718263517, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0015550810673653737}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.32014456374564415, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.001994286539846333}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.40252942143619874, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0024450797012346218}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.3444533365407922, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0018019008736801165}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 4, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b6bc4seed2/evaluation/generation/agg.4b284b6bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_5.json b/4b284b6bc4seed2/evaluation/generation/agg.4b284b6bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_5.json new file mode 100644 index 0000000000000000000000000000000000000000..648202e4d47a0432699caf766dba9f3a664a5433 --- /dev/null +++ b/4b284b6bc4seed2/evaluation/generation/agg.4b284b6bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_5.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 10.242478339458849, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.15925298363618348}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.3847914899421603, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.002183175369376523}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.4774457234022992, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.002464818162721772}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.411488509635484, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0018020990796425748}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.17466204582352918, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0015530402332911797}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.22030265368490773, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0019596071325407617}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.18753065960202087, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0015196039524377218}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.2682876782077045, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0017434660077252258}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.3357310111978014, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0021781101054053217}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.2877066533447448, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0015722869589788488}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.32327624212453093, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0020620269813736254}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.4015164129730794, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0024008264881823175}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.34582724571038975, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0018153943190470448}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 5, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b6bc4seed2/evaluation/generation/agg.4b284b6bc4seed2_gem_xsum_article_DOC_summary_0.json b/4b284b6bc4seed2/evaluation/generation/agg.4b284b6bc4seed2_gem_xsum_article_DOC_summary_0.json new file mode 100644 index 0000000000000000000000000000000000000000..69b3e5d7f5e5c00c6bbef2b43102f65e0d0d8438 --- /dev/null +++ b/4b284b6bc4seed2/evaluation/generation/agg.4b284b6bc4seed2_gem_xsum_article_DOC_summary_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.15562575636638382, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0018985685959581433}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.37071290923313827, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.00412806450314426}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.21561062837939882, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0023994286403233862}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.035854646948925664, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0011959015024675783}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.08777720514933714, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0028093393672125244}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.04992047712716468, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0015659162879365486}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.11410361066824068, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0014883650475830462}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.27352828928489664, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0033358267453375847}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.15823496005416243, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0018701288881012726}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.12411547049969442, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0016095217901991009}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.29756544693353426, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0036531260756102256}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.17227583896279217, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0020612622488592977}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 1.9895418658955089, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.058791202685981404}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b6bc4seed2/evaluation/generation/agg.4b284b6bc4seed2_gem_xsum_article_DOC_summary_1.json b/4b284b6bc4seed2/evaluation/generation/agg.4b284b6bc4seed2_gem_xsum_article_DOC_summary_1.json new file mode 100644 index 0000000000000000000000000000000000000000..1300a146806113fbe30ca9e1f64dad99108774cc --- /dev/null +++ b/4b284b6bc4seed2/evaluation/generation/agg.4b284b6bc4seed2_gem_xsum_article_DOC_summary_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.12450251214516139, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0017701644559474019}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.3066220711240498, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004028698629097141}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.17500466633779274, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002369834619717104}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.022425235776437836, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0009260101083179589}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.05660716486590679, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0023949778530059774}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.03174368690811647, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0013089569557441355}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.09339225179828282, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0012872208930509489}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.23225364174357402, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.003121701045125992}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.13160921880048357, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0017477071878516516}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.10120518962461963, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0014558021924337414}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.2508945472267905, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0034731782884289226}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.14248813343338157, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.001971817720719966}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 1.22504315109096, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.09308335353980157}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b6bc4seed2/evaluation/generation/agg.4b284b6bc4seed2_gem_xsum_article_DOC_summary_2.json b/4b284b6bc4seed2/evaluation/generation/agg.4b284b6bc4seed2_gem_xsum_article_DOC_summary_2.json new file mode 100644 index 0000000000000000000000000000000000000000..388444709618e7d3b853acad2ebe9f1bef793283 --- /dev/null +++ b/4b284b6bc4seed2/evaluation/generation/agg.4b284b6bc4seed2_gem_xsum_article_DOC_summary_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.1234862615247332, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.001784653293189628}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.3044465438832426, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.003981514741893442}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.17365706390997016, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0023744297279891893}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.02226790525553246, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.000942452403285749}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.056422620727974965, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0024200696931415224}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.03153224014629812, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.00132441371576198}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.09368957768118093, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0013169064303781464}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.23355487572465355, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0031690210056585975}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.13213102627357046, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0017809957835749522}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.10021625167450877, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.001468880768310731}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.24963190949674946, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0034860586627063653}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.14132095054221017, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0019853871709270238}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 1.298794808823118, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.09705115916767015}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b6bc4seed2/evaluation/generation/agg.4b284b6bc4seed2_gem_xsum_article_DOC_summary_3.json b/4b284b6bc4seed2/evaluation/generation/agg.4b284b6bc4seed2_gem_xsum_article_DOC_summary_3.json new file mode 100644 index 0000000000000000000000000000000000000000..f16608bbbe513d0a2c0e7cf1ca2993419515066c --- /dev/null +++ b/4b284b6bc4seed2/evaluation/generation/agg.4b284b6bc4seed2_gem_xsum_article_DOC_summary_3.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.11844914382273448, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0019201993243810158}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.28390135387162757, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004220868188703738}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.16354635610802612, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0024663949649927435}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.02107624492911234, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.000925135660801624}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.05264382125378585, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0023516589207668815}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.029556549223572853, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0012888784997271304}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.09104582658177605, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0014168096722186306}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.22075959991016572, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.003328818909079906}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.12619122655248322, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0018579466532603177}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.09565182333428005, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.001567884974278684}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.23135719936282417, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0035958537292906803}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.1324788344627292, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0020440661672023576}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 1.3205278027479164, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.09561115002496487}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 3, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b6bc4seed2/evaluation/generation/agg.4b284b6bc4seed2_gem_xsum_article_DOC_summary_4.json b/4b284b6bc4seed2/evaluation/generation/agg.4b284b6bc4seed2_gem_xsum_article_DOC_summary_4.json new file mode 100644 index 0000000000000000000000000000000000000000..0ce7f88eaa1873fa7689bb976628626f45fa3cc3 --- /dev/null +++ b/4b284b6bc4seed2/evaluation/generation/agg.4b284b6bc4seed2_gem_xsum_article_DOC_summary_4.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.039205474045436915, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0025102333275441356}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.07293349387654642, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004216797737450448}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.046239903656618994, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002631695063266343}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.0065884676077519935, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0006855012194927015}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.01391800911864852, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0014107292938298562}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.008394359766787172, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0008212624322810702}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.030224247701060337, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0020534035064510973}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.05511074735500151, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0031931944384416162}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.034807968155924324, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.001962639728158149}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.03234508109476721, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.002152956064622564}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.059639154094017835, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0034861307417076055}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.03760898789185391, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.002134288615760715}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 0.6426176499265798, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.10944172884159943}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 4, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b6bc4seed2/evaluation/generation/agg.4b284b6bc4seed2_gem_xsum_article_DOC_summary_5.json b/4b284b6bc4seed2/evaluation/generation/agg.4b284b6bc4seed2_gem_xsum_article_DOC_summary_5.json new file mode 100644 index 0000000000000000000000000000000000000000..c0c4cc51d75c7b528d44f0c1038ba9a0df16847c --- /dev/null +++ b/4b284b6bc4seed2/evaluation/generation/agg.4b284b6bc4seed2_gem_xsum_article_DOC_summary_5.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.0021575243350025752, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0006054243071962044}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.001704266236696643, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0004652377643070007}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.001882160171017921, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0005176393078664199}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.0003161470420071974, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.00012902342640180555}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.00022809737432378943, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 9.478510684431686e-05}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.000263097920800064, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.00010803201929354118}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.0016748107867624196, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0004791518665809304}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.00132498621769639, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0003711043260363234}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.0014623646787355947, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.00041204303295078344}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.0017284128450814592, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.000493769341153888}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.0013567504004039692, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0003777491879943449}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.0015022545826009262, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.00042147455797712205}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 5.88065686206085e-38, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 3.723633937038377e-32}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 5, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b6bc4seed2/evaluation/generation/examples.4b284b6bc4seed2_GEM-web_nlg_en_PALM_prompt_0.jsonl b/4b284b6bc4seed2/evaluation/generation/examples.4b284b6bc4seed2_GEM-web_nlg_en_PALM_prompt_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..140b5a2deb006448d79ed596d0306cf8b99698c8 --- /dev/null +++ b/4b284b6bc4seed2/evaluation/generation/examples.4b284b6bc4seed2_GEM-web_nlg_en_PALM_prompt_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:abd38833ae9adad365ff09dcdcc0d10e64a44acb0121dd6068e68578685879d6 +size 4143375 diff --git a/4b284b6bc4seed2/evaluation/generation/examples.4b284b6bc4seed2_GEM-web_nlg_en_PALM_prompt_1.jsonl b/4b284b6bc4seed2/evaluation/generation/examples.4b284b6bc4seed2_GEM-web_nlg_en_PALM_prompt_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..22bab3ae92503fe2a29bbace50e1bffa49866686 --- /dev/null +++ b/4b284b6bc4seed2/evaluation/generation/examples.4b284b6bc4seed2_GEM-web_nlg_en_PALM_prompt_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8cd67081a190ec728131a8bdea916f43091cce226ed5231a5ff966d9ac4c9cc7 +size 5101551 diff --git a/4b284b6bc4seed2/evaluation/generation/examples.4b284b6bc4seed2_GEM-web_nlg_en_PALM_prompt_2.jsonl b/4b284b6bc4seed2/evaluation/generation/examples.4b284b6bc4seed2_GEM-web_nlg_en_PALM_prompt_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..a774bc04e4e9ed11be75ea8ccc88e892ccaca40a --- /dev/null +++ b/4b284b6bc4seed2/evaluation/generation/examples.4b284b6bc4seed2_GEM-web_nlg_en_PALM_prompt_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d6f81db16c41e9bfec81c25d8005501d268f7d9a056c92dc98b4f2e238ee7f61 +size 5988704 diff --git a/4b284b6bc4seed2/evaluation/generation/examples.4b284b6bc4seed2_GEM-web_nlg_en_PALM_prompt_3.jsonl b/4b284b6bc4seed2/evaluation/generation/examples.4b284b6bc4seed2_GEM-web_nlg_en_PALM_prompt_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..fb07229cc2b1125f7171135a6f4f015e97b38d5a --- /dev/null +++ b/4b284b6bc4seed2/evaluation/generation/examples.4b284b6bc4seed2_GEM-web_nlg_en_PALM_prompt_3.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e836bb15e2b5979409e8f0fe7c97ea1dfca50396a9816d133d84c404c00372a7 +size 6911673 diff --git a/4b284b6bc4seed2/evaluation/generation/examples.4b284b6bc4seed2_GEM-web_nlg_en_PALM_prompt_4.jsonl b/4b284b6bc4seed2/evaluation/generation/examples.4b284b6bc4seed2_GEM-web_nlg_en_PALM_prompt_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..d1cd74f082870bab4984bb83a7fcee09da74154a --- /dev/null +++ b/4b284b6bc4seed2/evaluation/generation/examples.4b284b6bc4seed2_GEM-web_nlg_en_PALM_prompt_4.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:41186ef6eb28e62f43ef06bd3d1182d70801303a30b1fe30c74ee064ed92d4aa +size 7815907 diff --git a/4b284b6bc4seed2/evaluation/generation/examples.4b284b6bc4seed2_GEM-web_nlg_en_PALM_prompt_5.jsonl b/4b284b6bc4seed2/evaluation/generation/examples.4b284b6bc4seed2_GEM-web_nlg_en_PALM_prompt_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..97a32a39e1e9e10a94b8db10de7ffe6f1f54471d --- /dev/null +++ b/4b284b6bc4seed2/evaluation/generation/examples.4b284b6bc4seed2_GEM-web_nlg_en_PALM_prompt_5.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4bcca4a2a9a9cb7a9e108f14cc2cfb6e1160f88e4e2fec66f72f9760f1954bd9 +size 8720419 diff --git a/4b284b6bc4seed2/evaluation/generation/examples.4b284b6bc4seed2_GEM-wiki_lingua_en_tldr_en_0.jsonl b/4b284b6bc4seed2/evaluation/generation/examples.4b284b6bc4seed2_GEM-wiki_lingua_en_tldr_en_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..774a92f471b03469aed314e363a8c04b5d9bb6e5 --- /dev/null +++ b/4b284b6bc4seed2/evaluation/generation/examples.4b284b6bc4seed2_GEM-wiki_lingua_en_tldr_en_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:31a57312e8514732d39da4b9022376b0233b0e5b085ce21f54fac03368a92d42 +size 7694080 diff --git a/4b284b6bc4seed2/evaluation/generation/examples.4b284b6bc4seed2_GEM-wiki_lingua_en_tldr_en_1.jsonl b/4b284b6bc4seed2/evaluation/generation/examples.4b284b6bc4seed2_GEM-wiki_lingua_en_tldr_en_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..c3315476d7eca6eb15b3d9c8e1d763cd814f21c6 --- /dev/null +++ b/4b284b6bc4seed2/evaluation/generation/examples.4b284b6bc4seed2_GEM-wiki_lingua_en_tldr_en_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d52f1815df859431e629f92e75356499b606538477f1cb7c433c3c00c5a3b6e5 +size 13320983 diff --git a/4b284b6bc4seed2/evaluation/generation/examples.4b284b6bc4seed2_GEM-wiki_lingua_en_tldr_en_2.jsonl b/4b284b6bc4seed2/evaluation/generation/examples.4b284b6bc4seed2_GEM-wiki_lingua_en_tldr_en_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..e430ac9ae06c0b2e3e255d3d1470c484fa6fadf0 --- /dev/null +++ b/4b284b6bc4seed2/evaluation/generation/examples.4b284b6bc4seed2_GEM-wiki_lingua_en_tldr_en_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:af788c21ad97c519f026cba91d47cbbfb3d5b0a4e9f3a5724366d1a0eaa2113b +size 18926265 diff --git a/4b284b6bc4seed2/evaluation/generation/examples.4b284b6bc4seed2_GEM-wiki_lingua_en_tldr_en_3.jsonl b/4b284b6bc4seed2/evaluation/generation/examples.4b284b6bc4seed2_GEM-wiki_lingua_en_tldr_en_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..d32b376f5d1225b0d0d15d18d8fdf4c9876cc1ba --- /dev/null +++ b/4b284b6bc4seed2/evaluation/generation/examples.4b284b6bc4seed2_GEM-wiki_lingua_en_tldr_en_3.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fb7d8a022af87f903f71d3bc1ee29326808877195ff032d9d69755e52f43a39b +size 24343980 diff --git a/4b284b6bc4seed2/evaluation/generation/examples.4b284b6bc4seed2_GEM-wiki_lingua_en_tldr_en_4.jsonl b/4b284b6bc4seed2/evaluation/generation/examples.4b284b6bc4seed2_GEM-wiki_lingua_en_tldr_en_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..e07800ba65f1140bce999c5787a5af0299df99d8 --- /dev/null +++ b/4b284b6bc4seed2/evaluation/generation/examples.4b284b6bc4seed2_GEM-wiki_lingua_en_tldr_en_4.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4a629dacbb616fc1f983ed589b492f084323783042a92d3eb66d2b68ef40d2ca +size 29476855 diff --git a/4b284b6bc4seed2/evaluation/generation/examples.4b284b6bc4seed2_GEM-wiki_lingua_en_tldr_en_5.jsonl b/4b284b6bc4seed2/evaluation/generation/examples.4b284b6bc4seed2_GEM-wiki_lingua_en_tldr_en_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..d043ff7f7ceb927afa602c2cdadc09cf26bf12a0 --- /dev/null +++ b/4b284b6bc4seed2/evaluation/generation/examples.4b284b6bc4seed2_GEM-wiki_lingua_en_tldr_en_5.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7f084eba654011f33959af23c8018b6d4b3fa4a0370d1314f29348cdbd2cf81e +size 34799981 diff --git a/4b284b6bc4seed2/evaluation/generation/examples.4b284b6bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl b/4b284b6bc4seed2/evaluation/generation/examples.4b284b6bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..7e1912165f9e668494fbccb8e43f32cffad223c3 --- /dev/null +++ b/4b284b6bc4seed2/evaluation/generation/examples.4b284b6bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a283bf8b6868564e1ae510891ffb766d511188f024bfa3ab9fcc77f61f83d515 +size 4296735 diff --git a/4b284b6bc4seed2/evaluation/generation/examples.4b284b6bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl b/4b284b6bc4seed2/evaluation/generation/examples.4b284b6bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..c08ce2b0c553500d53febb0add335742b404bb0d --- /dev/null +++ b/4b284b6bc4seed2/evaluation/generation/examples.4b284b6bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3681f3b2773dcbf0b231eabaef4cc9ee80c87d7a114efbe814ecdcd10c81de56 +size 5156197 diff --git a/4b284b6bc4seed2/evaluation/generation/examples.4b284b6bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl b/4b284b6bc4seed2/evaluation/generation/examples.4b284b6bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..384157439e9d02c5125d4d28f1f11ef0c61b0d12 --- /dev/null +++ b/4b284b6bc4seed2/evaluation/generation/examples.4b284b6bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3c69109fb979e7be557bcc2be8365d11e1952a54e873fb997e70ac62a976290c +size 6302472 diff --git a/4b284b6bc4seed2/evaluation/generation/examples.4b284b6bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl b/4b284b6bc4seed2/evaluation/generation/examples.4b284b6bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..576dc2fc6577dd710b37001a762fcde723efa8f3 --- /dev/null +++ b/4b284b6bc4seed2/evaluation/generation/examples.4b284b6bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:41c202fb5b75725dcac61736430379abbc7f654402980315ba1e12636d7b162f +size 7407308 diff --git a/4b284b6bc4seed2/evaluation/generation/examples.4b284b6bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl b/4b284b6bc4seed2/evaluation/generation/examples.4b284b6bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..8a7a5e28cfc4f0041b6621b6fd6d2e98a1d53026 --- /dev/null +++ b/4b284b6bc4seed2/evaluation/generation/examples.4b284b6bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6ca761242e38b9d364fb1a0d21649f9dd0497ab954e8390dd0f522a6c3f93182 +size 8476167 diff --git a/4b284b6bc4seed2/evaluation/generation/examples.4b284b6bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl b/4b284b6bc4seed2/evaluation/generation/examples.4b284b6bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..4b3662d4ce9ab2b1574b48e0578a3a1c6e39433d --- /dev/null +++ b/4b284b6bc4seed2/evaluation/generation/examples.4b284b6bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:60a070f4bb1a22784654e1b4dcec92ed6b1ae6a54ff55dd8027bbfadf1e2d5a3 +size 9556010 diff --git a/4b284b6bc4seed2/evaluation/generation/examples.4b284b6bc4seed2_gem_xsum_article_DOC_summary_0.jsonl b/4b284b6bc4seed2/evaluation/generation/examples.4b284b6bc4seed2_gem_xsum_article_DOC_summary_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..4bbb71d6a22d88b7aaf5449e4c76ef138b1b2f3f --- /dev/null +++ b/4b284b6bc4seed2/evaluation/generation/examples.4b284b6bc4seed2_gem_xsum_article_DOC_summary_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5d5fdb09bb0004366522ce3318d51a468c7bddd58cdadb56ba44c9b053e06794 +size 2831806 diff --git a/4b284b6bc4seed2/evaluation/generation/examples.4b284b6bc4seed2_gem_xsum_article_DOC_summary_1.jsonl b/4b284b6bc4seed2/evaluation/generation/examples.4b284b6bc4seed2_gem_xsum_article_DOC_summary_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..76542d5106041c3cda1f63c67305cc3d1b78f179 --- /dev/null +++ b/4b284b6bc4seed2/evaluation/generation/examples.4b284b6bc4seed2_gem_xsum_article_DOC_summary_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:90124f9e9baf23c00cfb75fcb6d77c332a410d976a8a3e98796c80eacc1f8de1 +size 5102955 diff --git a/4b284b6bc4seed2/evaluation/generation/examples.4b284b6bc4seed2_gem_xsum_article_DOC_summary_2.jsonl b/4b284b6bc4seed2/evaluation/generation/examples.4b284b6bc4seed2_gem_xsum_article_DOC_summary_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..f1a50f936dd17f3654ac94aac8f5f5994b782be5 --- /dev/null +++ b/4b284b6bc4seed2/evaluation/generation/examples.4b284b6bc4seed2_gem_xsum_article_DOC_summary_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0dda8536a4f613271cfd77c4451b543945d707ea11e51a02bb0a01a94612bf55 +size 7376844 diff --git a/4b284b6bc4seed2/evaluation/generation/examples.4b284b6bc4seed2_gem_xsum_article_DOC_summary_3.jsonl b/4b284b6bc4seed2/evaluation/generation/examples.4b284b6bc4seed2_gem_xsum_article_DOC_summary_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..1cb9fc123dd011cbdc4cd3260d089c5896cd6b00 --- /dev/null +++ b/4b284b6bc4seed2/evaluation/generation/examples.4b284b6bc4seed2_gem_xsum_article_DOC_summary_3.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b588f98d3be864cc54ddf81e4446e2a49ac89ec1a51b52c1efab6b5db63b992e +size 9644358 diff --git a/4b284b6bc4seed2/evaluation/generation/examples.4b284b6bc4seed2_gem_xsum_article_DOC_summary_4.jsonl b/4b284b6bc4seed2/evaluation/generation/examples.4b284b6bc4seed2_gem_xsum_article_DOC_summary_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..a8972661a02bcc700049fae213eccd37227985a5 --- /dev/null +++ b/4b284b6bc4seed2/evaluation/generation/examples.4b284b6bc4seed2_gem_xsum_article_DOC_summary_4.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:39e9f3e85bae14c9752655e9a2ec7c7e2de28e0319e4376d4655d422e52d682e +size 11672040 diff --git a/4b284b6bc4seed2/evaluation/generation/examples.4b284b6bc4seed2_gem_xsum_article_DOC_summary_5.jsonl b/4b284b6bc4seed2/evaluation/generation/examples.4b284b6bc4seed2_gem_xsum_article_DOC_summary_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..60fc42319f06752ae4dc4a8c34b8300f265acf02 --- /dev/null +++ b/4b284b6bc4seed2/evaluation/generation/examples.4b284b6bc4seed2_gem_xsum_article_DOC_summary_5.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:92d22ec8ef6315aa6e6981be4dce57c25f51f3a21a187c44776584ba0bd4e8f6 +size 13897555 diff --git a/4b284b6bc4seed2/evaluation/generation/merged.csv b/4b284b6bc4seed2/evaluation/generation/merged.csv new file mode 100644 index 0000000000000000000000000000000000000000..384388cb0ea196f0e55ea17c41c7e4890880dd07 --- /dev/null +++ b/4b284b6bc4seed2/evaluation/generation/merged.csv @@ -0,0 +1,53 @@ +dataset,fewshots,prompt,metric,value +e2e_nlg_cleaned,0,generate_text_restaurant,rouge2_fmeasure,0.04387542635560367 +e2e_nlg_cleaned,0,median,rouge2_fmeasure,0.04387542635560367 +e2e_nlg_cleaned,1,generate_text_restaurant,rouge2_fmeasure,0.17029119687013236 +e2e_nlg_cleaned,1,median,rouge2_fmeasure,0.17029119687013236 +e2e_nlg_cleaned,2,generate_text_restaurant,rouge2_fmeasure,0.1817582009151592 +e2e_nlg_cleaned,2,median,rouge2_fmeasure,0.1817582009151592 +e2e_nlg_cleaned,3,generate_text_restaurant,rouge2_fmeasure,0.18366190818796568 +e2e_nlg_cleaned,3,median,rouge2_fmeasure,0.18366190818796568 +e2e_nlg_cleaned,4,generate_text_restaurant,rouge2_fmeasure,0.1863731784770829 +e2e_nlg_cleaned,4,median,rouge2_fmeasure,0.1863731784770829 +e2e_nlg_cleaned,5,generate_text_restaurant,rouge2_fmeasure,0.18753065960202087 +e2e_nlg_cleaned,5,median,rouge2_fmeasure,0.18753065960202087 +e2e_nlg_cleaned,5,average,multiple,0.15891509506799412 +gem_xsum,0,article_DOC_summary,rouge2_fmeasure,0.04992047712716468 +gem_xsum,0,median,rouge2_fmeasure,0.04992047712716468 +gem_xsum,1,article_DOC_summary,rouge2_fmeasure,0.03174368690811647 +gem_xsum,1,median,rouge2_fmeasure,0.03174368690811647 +gem_xsum,2,article_DOC_summary,rouge2_fmeasure,0.03153224014629812 +gem_xsum,2,median,rouge2_fmeasure,0.03153224014629812 +gem_xsum,3,article_DOC_summary,rouge2_fmeasure,0.029556549223572853 +gem_xsum,3,median,rouge2_fmeasure,0.029556549223572853 +gem_xsum,4,article_DOC_summary,rouge2_fmeasure,0.008394359766787172 +gem_xsum,4,median,rouge2_fmeasure,0.008394359766787172 +gem_xsum,5,article_DOC_summary,rouge2_fmeasure,0.000263097920800064 +gem_xsum,5,median,rouge2_fmeasure,0.000263097920800064 +gem_xsum,5,average,multiple,0.02523506851545656 +web_nlg_en,0,PALM_prompt,rouge2_fmeasure,0.05421096419841178 +web_nlg_en,0,median,rouge2_fmeasure,0.05421096419841178 +web_nlg_en,1,PALM_prompt,rouge2_fmeasure,0.05647199175457009 +web_nlg_en,1,median,rouge2_fmeasure,0.05647199175457009 +web_nlg_en,2,PALM_prompt,rouge2_fmeasure,0.057979391263589294 +web_nlg_en,2,median,rouge2_fmeasure,0.057979391263589294 +web_nlg_en,3,PALM_prompt,rouge2_fmeasure,0.05738575356669148 +web_nlg_en,3,median,rouge2_fmeasure,0.05738575356669148 +web_nlg_en,4,PALM_prompt,rouge2_fmeasure,0.05685164611012959 +web_nlg_en,4,median,rouge2_fmeasure,0.05685164611012959 +web_nlg_en,5,PALM_prompt,rouge2_fmeasure,0.05654046753025775 +web_nlg_en,5,median,rouge2_fmeasure,0.05654046753025775 +web_nlg_en,5,average,multiple,0.05657336907060833 +wiki_lingua_en,0,tldr_en,rouge2_fmeasure,0.039553536857052096 +wiki_lingua_en,0,median,rouge2_fmeasure,0.039553536857052096 +wiki_lingua_en,1,tldr_en,rouge2_fmeasure,0.04531387019112246 +wiki_lingua_en,1,median,rouge2_fmeasure,0.04531387019112246 +wiki_lingua_en,2,tldr_en,rouge2_fmeasure,0.04667487755408923 +wiki_lingua_en,2,median,rouge2_fmeasure,0.04667487755408923 +wiki_lingua_en,3,tldr_en,rouge2_fmeasure,0.03952258753236028 +wiki_lingua_en,3,median,rouge2_fmeasure,0.03952258753236028 +wiki_lingua_en,4,tldr_en,rouge2_fmeasure,0.013047921347416528 +wiki_lingua_en,4,median,rouge2_fmeasure,0.013047921347416528 +wiki_lingua_en,5,tldr_en,rouge2_fmeasure,0.0020021672595433877 +wiki_lingua_en,5,median,rouge2_fmeasure,0.0020021672595433877 +wiki_lingua_en,5,average,multiple,0.03101916012359733 diff --git a/4b284b6bc4seed2/evaluation/generation/merged.json b/4b284b6bc4seed2/evaluation/generation/merged.json new file mode 100644 index 0000000000000000000000000000000000000000..9d5f95792def5fc070f65ea45a3df518a515de9b --- /dev/null +++ b/4b284b6bc4seed2/evaluation/generation/merged.json @@ -0,0 +1 @@ +{"GEM/web_nlg_en": {"0": {"PALM_prompt": {"bleu": 0.4505969912144358, "bleu_stderr": 0.043025981663977676, "rouge1_fmeasure": 0.11475949399291512, "rouge1_fmeasure_stderr": 0.0020930584454703313, "rouge1_precision": 0.07715680688754782, "rouge1_precision_stderr": 0.0018501494099723034, "rouge1_recall": 0.32800192332635164, "rouge1_recall_stderr": 0.004716290361046614, "rouge2_fmeasure": 0.05421096419841178, "rouge2_fmeasure_stderr": 0.0013323602620276317, "rouge2_precision": 0.03691606942766564, "rouge2_precision_stderr": 0.001226252004533247, "rouge2_recall": 0.15714130080850514, "rouge2_recall_stderr": 0.003275285581951961, "rougeL_fmeasure": 0.1095828810892153, "rougeL_fmeasure_stderr": 0.0019205919592418358, "rougeL_precision": 0.07330043188559601, "rougeL_precision_stderr": 0.0016882205517441595, "rougeL_recall": 0.31747468696171116, "rougeL_recall_stderr": 0.004607770796206798, "rougeLsum_fmeasure": 0.10804953744361874, "rougeLsum_fmeasure_stderr": 0.0019462325362491339, "rougeLsum_precision": 0.07264308016772093, "rougeLsum_precision_stderr": 0.001734436368694926, "rougeLsum_recall": 0.30915040739896027, "rougeLsum_recall_stderr": 0.004387887182362267}}, "1": {"PALM_prompt": {"bleu": 0.5248973715012223, "bleu_stderr": 0.04500340113008066, "rouge1_fmeasure": 0.12116080004166574, "rouge1_fmeasure_stderr": 0.002034248506156313, "rouge1_precision": 0.0790761668773179, "rouge1_precision_stderr": 0.0016843496475256363, "rouge1_recall": 0.3697333749180133, "rouge1_recall_stderr": 0.005009866939283317, "rouge2_fmeasure": 0.05647199175457009, "rouge2_fmeasure_stderr": 0.0013066532545353317, "rouge2_precision": 0.03678510490686299, "rouge2_precision_stderr": 0.001081873045114326, "rouge2_recall": 0.17843660776062029, "rouge2_recall_stderr": 0.003489215109878396, "rougeL_fmeasure": 0.11376961245179681, "rougeL_fmeasure_stderr": 0.0018264898168477456, "rougeL_precision": 0.07404916365054973, "rougeL_precision_stderr": 0.0015255606390290489, "rougeL_recall": 0.34923402691643046, "rougeL_recall_stderr": 0.004687346760287558, "rougeLsum_fmeasure": 0.11395978695320426, "rougeLsum_fmeasure_stderr": 0.0018994693226140945, "rougeLsum_precision": 0.07445381060380506, "rougeLsum_precision_stderr": 0.001593181333906948, "rougeLsum_recall": 0.3467160374634341, "rougeLsum_recall_stderr": 0.004579407380382054}}, "2": {"PALM_prompt": {"bleu": 0.5767647931281593, "bleu_stderr": 0.03075444324731624, "rouge1_fmeasure": 0.12441199271565954, "rouge1_fmeasure_stderr": 0.001979354566482751, "rouge1_precision": 0.08030107100423996, "rouge1_precision_stderr": 0.0015674832760453747, "rouge1_recall": 0.38840421585850693, "rouge1_recall_stderr": 0.005175482568072094, "rouge2_fmeasure": 0.057979391263589294, "rouge2_fmeasure_stderr": 0.0012537328703996166, "rouge2_precision": 0.037112804584329, "rouge2_precision_stderr": 0.0009141020328534724, "rouge2_recall": 0.19070965082945687, "rouge2_recall_stderr": 0.003653414412934534, "rougeL_fmeasure": 0.11464846086222981, "rougeL_fmeasure_stderr": 0.0017509905495136865, "rougeL_precision": 0.07384535953637529, "rougeL_precision_stderr": 0.0013915854560762077, "rougeL_recall": 0.3595423504669609, "rougeL_recall_stderr": 0.00473567632900781, "rougeLsum_fmeasure": 0.11714224514649191, "rougeLsum_fmeasure_stderr": 0.0018352989430204284, "rougeLsum_precision": 0.07564699950143948, "rougeLsum_precision_stderr": 0.0014680313985962644, "rougeLsum_recall": 0.3655854110990312, "rougeLsum_recall_stderr": 0.0047861725768252785}}, "3": {"PALM_prompt": {"bleu": 0.6551242086874565, "bleu_stderr": 0.03786184470041364, "rouge1_fmeasure": 0.12253462963491722, "rouge1_fmeasure_stderr": 0.0019458379147742845, "rouge1_precision": 0.07882570317453028, "rouge1_precision_stderr": 0.0015398380099203338, "rouge1_recall": 0.39347312457818545, "rouge1_recall_stderr": 0.005115592107070138, "rouge2_fmeasure": 0.05738575356669148, "rouge2_fmeasure_stderr": 0.0012433710684840093, "rouge2_precision": 0.0365856093502546, "rouge2_precision_stderr": 0.0009020386358581405, "rouge2_recall": 0.19448869036942362, "rouge2_recall_stderr": 0.0036911175236007915, "rougeL_fmeasure": 0.11178706827138284, "rougeL_fmeasure_stderr": 0.0016888026831589167, "rougeL_precision": 0.07184479663593357, "rougeL_precision_stderr": 0.0013555990593936752, "rougeL_recall": 0.36011891059508755, "rougeL_recall_stderr": 0.004569680331874904, "rougeLsum_fmeasure": 0.11492232075242285, "rougeLsum_fmeasure_stderr": 0.0018044818590991203, "rougeLsum_precision": 0.07401320225138429, "rougeLsum_precision_stderr": 0.001446688093860126, "rougeLsum_recall": 0.3682561684373326, "rougeLsum_recall_stderr": 0.004661037301261206}}, "4": {"PALM_prompt": {"bleu": 0.6361569019073665, "bleu_stderr": 0.048795806087287424, "rouge1_fmeasure": 0.12333237651607433, "rouge1_fmeasure_stderr": 0.0018995495239739787, "rouge1_precision": 0.07936192579865504, "rouge1_precision_stderr": 0.0015426897773666887, "rouge1_recall": 0.3967228621080476, "rouge1_recall_stderr": 0.005035788052603314, "rouge2_fmeasure": 0.05685164611012959, "rouge2_fmeasure_stderr": 0.001193840199959299, "rouge2_precision": 0.0361795830053176, "rouge2_precision_stderr": 0.0008771942709925916, "rouge2_recall": 0.19495589680109515, "rouge2_recall_stderr": 0.0036179457975666733, "rougeL_fmeasure": 0.11262522353373274, "rougeL_fmeasure_stderr": 0.001668123718914031, "rougeL_precision": 0.07239948675670523, "rougeL_precision_stderr": 0.0013748540153599564, "rougeL_recall": 0.3637724702147103, "rougeL_recall_stderr": 0.004528167648238907, "rougeLsum_fmeasure": 0.11594403375103957, "rougeLsum_fmeasure_stderr": 0.0017604845749238877, "rougeLsum_precision": 0.07461562643114039, "rougeLsum_precision_stderr": 0.0014456314194904961, "rougeLsum_recall": 0.3734381336992152, "rougeLsum_recall_stderr": 0.004658729212112421}}, "5": {"PALM_prompt": {"bleu": 0.6348116381689767, "bleu_stderr": 0.025032005928245744, "rouge1_fmeasure": 0.12151531670936837, "rouge1_fmeasure_stderr": 0.0018013952412054407, "rouge1_precision": 0.07772480241459157, "rouge1_precision_stderr": 0.0014761937289481531, "rouge1_recall": 0.39775384294624816, "rouge1_recall_stderr": 0.005043126900140792, "rouge2_fmeasure": 0.05654046753025775, "rouge2_fmeasure_stderr": 0.0011574259112533843, "rouge2_precision": 0.03642686374060602, "rouge2_precision_stderr": 0.0010535500618274554, "rouge2_recall": 0.1954871545530622, "rouge2_recall_stderr": 0.0036330438060616513, "rougeL_fmeasure": 0.1106233752219019, "rougeL_fmeasure_stderr": 0.0016037607255517253, "rougeL_precision": 0.0708062283164349, "rougeL_precision_stderr": 0.0013339231845929654, "rougeL_recall": 0.3620745179558994, "rougeL_recall_stderr": 0.00449776594486043, "rougeLsum_fmeasure": 0.1140750876332385, "rougeLsum_fmeasure_stderr": 0.0016853800565220047, "rougeLsum_precision": 0.07304451504316123, "rougeLsum_precision_stderr": 0.0013879168010522463, "rougeLsum_recall": 0.37251915128720225, "rougeLsum_recall_stderr": 0.00464816980850311}}}, "GEM/wiki_lingua_en": {"0": {"tldr_en": {"bleu": 1.7934141534025163, "bleu_stderr": 0.08383146848244837, "rouge1_fmeasure": 0.18760609214914972, "rouge1_fmeasure_stderr": 0.0018528010283896678, "rouge1_precision": 0.1603204965143781, "rouge1_precision_stderr": 0.0019055374186705493, "rouge1_recall": 0.273148053641277, "rouge1_recall_stderr": 0.00271429826551829, "rouge2_fmeasure": 0.039553536857052096, "rouge2_fmeasure_stderr": 0.0009080316883759782, "rouge2_precision": 0.03352653833860025, "rouge2_precision_stderr": 0.0008141842668329252, "rouge2_recall": 0.059532665192850664, "rouge2_recall_stderr": 0.001495886372304702, "rougeL_fmeasure": 0.14148134446020433, "rougeL_fmeasure_stderr": 0.001278578656113803, "rougeL_precision": 0.11956609361350197, "rougeL_precision_stderr": 0.001288770553600895, "rougeL_recall": 0.21092821240171705, "rougeL_recall_stderr": 0.002145023872994803, "rougeLsum_fmeasure": 0.17295948170907235, "rougeLsum_fmeasure_stderr": 0.0016989010001995553, "rougeLsum_precision": 0.1475742184322245, "rougeLsum_precision_stderr": 0.001744563798127783, "rougeLsum_recall": 0.25286325424170925, "rougeLsum_recall_stderr": 0.0025434557707113424}}, "1": {"tldr_en": {"bleu": 2.2027676863872756, "bleu_stderr": 0.07884539943019493, "rouge1_fmeasure": 0.20404111705603262, "rouge1_fmeasure_stderr": 0.0018961046573895371, "rouge1_precision": 0.1745195547370322, "rouge1_precision_stderr": 0.0020211127459286177, "rouge1_recall": 0.29756863851182014, "rouge1_recall_stderr": 0.002720442694533944, "rouge2_fmeasure": 0.04531387019112246, "rouge2_fmeasure_stderr": 0.0009454489412507513, "rouge2_precision": 0.038836287518126324, "rouge2_precision_stderr": 0.0008918673703720118, "rouge2_recall": 0.0678582672753382, "rouge2_recall_stderr": 0.0015726696869910164, "rougeL_fmeasure": 0.14662233559425056, "rougeL_fmeasure_stderr": 0.0012675330724451579, "rougeL_precision": 0.12403344533976053, "rougeL_precision_stderr": 0.0013370363902071867, "rougeL_recall": 0.21966745113211172, "rougeL_recall_stderr": 0.002148471848315497, "rougeLsum_fmeasure": 0.19031232879553658, "rougeLsum_fmeasure_stderr": 0.0017631603815569407, "rougeLsum_precision": 0.16262281802775871, "rougeLsum_precision_stderr": 0.0018832504839498365, "rougeLsum_recall": 0.2785759841913255, "rougeLsum_recall_stderr": 0.002586017885803777}}, "2": {"tldr_en": {"bleu": 2.3891366560914298, "bleu_stderr": 0.08062856329183088, "rouge1_fmeasure": 0.2078510077674295, "rouge1_fmeasure_stderr": 0.0018302477945332431, "rouge1_precision": 0.17812583517946007, "rouge1_precision_stderr": 0.002009945937748485, "rouge1_recall": 0.303539848216664, "rouge1_recall_stderr": 0.002638500102412918, "rouge2_fmeasure": 0.04667487755408923, "rouge2_fmeasure_stderr": 0.0009128949090939083, "rouge2_precision": 0.03988619638649071, "rouge2_precision_stderr": 0.0008528640674491505, "rouge2_recall": 0.07069101771037783, "rouge2_recall_stderr": 0.0015418058212234357, "rougeL_fmeasure": 0.14847289603046035, "rougeL_fmeasure_stderr": 0.0012287208530959888, "rougeL_precision": 0.1260062676909843, "rougeL_precision_stderr": 0.001364424629646694, "rougeL_recall": 0.22269555369572, "rougeL_recall_stderr": 0.002089758754681962, "rougeLsum_fmeasure": 0.1948747340586584, "rougeLsum_fmeasure_stderr": 0.0017076787007878865, "rougeLsum_precision": 0.16673210140327593, "rougeLsum_precision_stderr": 0.001876553104110706, "rougeLsum_recall": 0.28573976969483017, "rougeLsum_recall_stderr": 0.002520262824141778}}, "3": {"tldr_en": {"bleu": 2.38911546645986, "bleu_stderr": 0.07647894828583013, "rouge1_fmeasure": 0.17428261104968168, "rouge1_fmeasure_stderr": 0.0021443814628730523, "rouge1_precision": 0.15466504916141774, "rouge1_precision_stderr": 0.002308226402178308, "rouge1_recall": 0.2551520537583065, "rouge1_recall_stderr": 0.0032171951632609264, "rouge2_fmeasure": 0.03952258753236028, "rouge2_fmeasure_stderr": 0.0009033133825001278, "rouge2_precision": 0.03492860218651495, "rouge2_precision_stderr": 0.0009155361590863039, "rouge2_recall": 0.060501291725340245, "rouge2_recall_stderr": 0.001568003123293494, "rougeL_fmeasure": 0.12499242197529943, "rougeL_fmeasure_stderr": 0.0014791492005730253, "rougeL_precision": 0.11061065008297513, "rougeL_precision_stderr": 0.0016789233374586393, "rougeL_recall": 0.1885220916112058, "rougeL_recall_stderr": 0.002535325446834288, "rougeLsum_fmeasure": 0.16396063897113883, "rougeLsum_fmeasure_stderr": 0.0020097929828463102, "rougeLsum_precision": 0.1453452296219742, "rougeLsum_precision_stderr": 0.0021599240195076573, "rougeLsum_recall": 0.24088194688429895, "rougeLsum_recall_stderr": 0.00305926261571982}}, "4": {"tldr_en": {"bleu": 0.5396555354382301, "bleu_stderr": 0.03382350846346006, "rouge1_fmeasure": 0.056665547293806504, "rouge1_fmeasure_stderr": 0.001891719846577204, "rouge1_precision": 0.053018296777332476, "rouge1_precision_stderr": 0.001989950046503427, "rouge1_recall": 0.08596667050742965, "rouge1_recall_stderr": 0.002947649719879261, "rouge2_fmeasure": 0.013047921347416528, "rouge2_fmeasure_stderr": 0.0006398386351669672, "rouge2_precision": 0.011358703706930581, "rouge2_precision_stderr": 0.000600320864289757, "rouge2_recall": 0.021640340405918963, "rouge2_recall_stderr": 0.0011802802866629615, "rougeL_fmeasure": 0.04210570382315936, "rougeL_fmeasure_stderr": 0.001378676251875729, "rougeL_precision": 0.03957496787938521, "rougeL_precision_stderr": 0.0015124056846112217, "rougeL_recall": 0.06552651052204829, "rougeL_recall_stderr": 0.0022922651246891222, "rougeLsum_fmeasure": 0.05326532550449904, "rougeLsum_fmeasure_stderr": 0.0017732306920814024, "rougeLsum_precision": 0.049771628442206735, "rougeLsum_precision_stderr": 0.0018700031303863793, "rougeLsum_recall": 0.08106940347167176, "rougeLsum_recall_stderr": 0.0027897599646264986}}, "5": {"tldr_en": {"bleu": 6.626695028697088e-07, "bleu_stderr": 1.1951854876786307e-06, "rouge1_fmeasure": 0.008692457481160468, "rouge1_fmeasure_stderr": 0.0008227750799750827, "rouge1_precision": 0.008477708430630778, "rouge1_precision_stderr": 0.0008888303927431226, "rouge1_recall": 0.013378525794197375, "rouge1_recall_stderr": 0.0013202915810629089, "rouge2_fmeasure": 0.0020021672595433877, "rouge2_fmeasure_stderr": 0.0002655938544483011, "rouge2_precision": 0.002035592041182627, "rouge2_precision_stderr": 0.0003440486575723203, "rouge2_recall": 0.003334615800958582, "rouge2_recall_stderr": 0.0004964329628462136, "rougeL_fmeasure": 0.006455452264291404, "rougeL_fmeasure_stderr": 0.0006047126016011451, "rougeL_precision": 0.006368490138883737, "rougeL_precision_stderr": 0.0006824241585392732, "rougeL_recall": 0.010162399165178543, "rougeL_recall_stderr": 0.0010265436936400937, "rougeLsum_fmeasure": 0.008133155428782728, "rougeLsum_fmeasure_stderr": 0.0007677758628473678, "rougeLsum_precision": 0.007948184602390525, "rougeLsum_precision_stderr": 0.0008399495471791939, "rougeLsum_recall": 0.012575544635440476, "rougeLsum_recall_stderr": 0.0012445710338658724}}}, "e2e_nlg_cleaned": {"0": {"generate_text_restaurant": {"bleu": 2.878712808592603, "bleu_stderr": 0.0853866064382545, "rouge1_fmeasure": 0.14598569647435716, "rouge1_fmeasure_stderr": 0.0019257642313717281, "rouge1_precision": 0.12473936122211624, "rouge1_precision_stderr": 0.001798387415150618, "rouge1_recall": 0.21205919428582165, "rouge1_recall_stderr": 0.002854707525591281, "rouge2_fmeasure": 0.04387542635560367, "rouge2_fmeasure_stderr": 0.0010442399588521244, "rouge2_precision": 0.03495666955822184, "rouge2_precision_stderr": 0.0008687034534547671, "rouge2_recall": 0.06654649371061956, "rouge2_recall_stderr": 0.0016084812198622184, "rougeL_fmeasure": 0.13483368037365023, "rougeL_fmeasure_stderr": 0.0016578290285278543, "rougeL_precision": 0.11526993035626307, "rougeL_precision_stderr": 0.001545375812569594, "rougeL_recall": 0.19660657514045912, "rougeL_recall_stderr": 0.0025255577441268087, "rougeLsum_fmeasure": 0.12774057149590898, "rougeLsum_fmeasure_stderr": 0.0016934965354593117, "rougeLsum_precision": 0.10944292922104659, "rougeLsum_precision_stderr": 0.0015541855309834716, "rougeLsum_recall": 0.1856831740193031, "rougeLsum_recall_stderr": 0.0025479048755850213}}, "1": {"generate_text_restaurant": {"bleu": 9.756713461785154, "bleu_stderr": 0.1556457646527884, "rouge1_fmeasure": 0.40687267868315097, "rouge1_fmeasure_stderr": 0.0018487565527517862, "rouge1_precision": 0.4098430493296336, "rouge1_precision_stderr": 0.002322243350403215, "rouge1_recall": 0.44204106174129115, "rouge1_recall_stderr": 0.002648076916437811, "rouge2_fmeasure": 0.17029119687013236, "rouge2_fmeasure_stderr": 0.0015443604787036918, "rouge2_precision": 0.17194753805951837, "rouge2_precision_stderr": 0.0017305953745273977, "rouge2_recall": 0.18647781584399134, "rouge2_recall_stderr": 0.0018885402575458418, "rougeL_fmeasure": 0.28000012009488995, "rougeL_fmeasure_stderr": 0.0015606595580042648, "rougeL_precision": 0.28268352481109116, "rougeL_precision_stderr": 0.0019277807551157933, "rougeL_recall": 0.30476888259625023, "rougeL_recall_stderr": 0.0021362292770155254, "rougeLsum_fmeasure": 0.3345777715915075, "rougeLsum_fmeasure_stderr": 0.001819480989061025, "rougeLsum_precision": 0.33736408060377443, "rougeLsum_precision_stderr": 0.002189042828443897, "rougeLsum_recall": 0.3634133186767332, "rougeLsum_recall_stderr": 0.0024561816405961946}}, "2": {"generate_text_restaurant": {"bleu": 9.703365784320074, "bleu_stderr": 0.16108986784891388, "rouge1_fmeasure": 0.4101176075687606, "rouge1_fmeasure_stderr": 0.0018267883175402378, "rouge1_precision": 0.392092480268303, "rouge1_precision_stderr": 0.002302537065374289, "rouge1_recall": 0.4700929192938433, "rouge1_recall_stderr": 0.0025952785236860797, "rouge2_fmeasure": 0.1817582009151592, "rouge2_fmeasure_stderr": 0.001527895144436596, "rouge2_precision": 0.17385266696101637, "rouge2_precision_stderr": 0.0016739605455478718, "rouge2_recall": 0.21043725627335938, "rouge2_recall_stderr": 0.0019419833439951327, "rougeL_fmeasure": 0.2819491223195203, "rougeL_fmeasure_stderr": 0.0015219411814398627, "rougeL_precision": 0.2694278866213945, "rougeL_precision_stderr": 0.0018257757886672125, "rougeL_recall": 0.32463760826780586, "rougeL_recall_stderr": 0.0021411692643784116, "rougeLsum_fmeasure": 0.341970457946986, "rougeLsum_fmeasure_stderr": 0.0017909707229488067, "rougeLsum_precision": 0.32676135279841206, "rougeLsum_precision_stderr": 0.002119047445904341, "rougeLsum_recall": 0.3923976496945184, "rougeLsum_recall_stderr": 0.002451591838805565}}, "3": {"generate_text_restaurant": {"bleu": 9.761234651073966, "bleu_stderr": 0.08117964062807032, "rouge1_fmeasure": 0.4065423629912447, "rouge1_fmeasure_stderr": 0.001806841436683923, "rouge1_precision": 0.3769467510554381, "rouge1_precision_stderr": 0.00213141802058671, "rouge1_recall": 0.4783045642626352, "rouge1_recall_stderr": 0.0025707591897062483, "rouge2_fmeasure": 0.18366190818796568, "rouge2_fmeasure_stderr": 0.0015116466616384265, "rouge2_precision": 0.16918099441968293, "rouge2_precision_stderr": 0.0015053602189487548, "rouge2_recall": 0.21947419317279818, "rouge2_recall_stderr": 0.002013053097487535, "rougeL_fmeasure": 0.2817551356956864, "rougeL_fmeasure_stderr": 0.0015262712862237756, "rougeL_precision": 0.2607744983983079, "rougeL_precision_stderr": 0.0016830752871787188, "rougeL_recall": 0.3333300743221725, "rougeL_recall_stderr": 0.0021979974365264774, "rougeLsum_fmeasure": 0.34229547153938067, "rougeLsum_fmeasure_stderr": 0.001786413003034628, "rougeLsum_precision": 0.31727007213590536, "rougeLsum_precision_stderr": 0.001993439598512182, "rougeLsum_recall": 0.40307149877627624, "rougeLsum_recall_stderr": 0.002469750781351579}}, "4": {"generate_text_restaurant": {"bleu": 10.060481335729593, "bleu_stderr": 0.13006673690205298, "rouge1_fmeasure": 0.40925099639651336, "rouge1_fmeasure_stderr": 0.0018052362806663203, "rouge1_precision": 0.3804171250877555, "rouge1_precision_stderr": 0.0021190302719114127, "rouge1_recall": 0.4780703069260566, "rouge1_recall_stderr": 0.002533824939435917, "rouge2_fmeasure": 0.1863731784770829, "rouge2_fmeasure_stderr": 0.0015333517641007584, "rouge2_precision": 0.17221168629234665, "rouge2_precision_stderr": 0.0015253603947935756, "rouge2_recall": 0.2208989636456487, "rouge2_recall_stderr": 0.0020171225023131564, "rougeL_fmeasure": 0.28431779718263517, "rougeL_fmeasure_stderr": 0.0015550810673653737, "rougeL_precision": 0.26364753406030395, "rougeL_precision_stderr": 0.001681924883574724, "rougeL_recall": 0.3339558499615528, "rougeL_recall_stderr": 0.0022103390891101316, "rougeLsum_fmeasure": 0.3444533365407922, "rougeLsum_fmeasure_stderr": 0.0018019008736801165, "rougeLsum_precision": 0.32014456374564415, "rougeLsum_precision_stderr": 0.001994286539846333, "rougeLsum_recall": 0.40252942143619874, "rougeLsum_recall_stderr": 0.0024450797012346218}}, "5": {"generate_text_restaurant": {"bleu": 10.242478339458849, "bleu_stderr": 0.15925298363618348, "rouge1_fmeasure": 0.411488509635484, "rouge1_fmeasure_stderr": 0.0018020990796425748, "rouge1_precision": 0.3847914899421603, "rouge1_precision_stderr": 0.002183175369376523, "rouge1_recall": 0.4774457234022992, "rouge1_recall_stderr": 0.002464818162721772, "rouge2_fmeasure": 0.18753065960202087, "rouge2_fmeasure_stderr": 0.0015196039524377218, "rouge2_precision": 0.17466204582352918, "rouge2_precision_stderr": 0.0015530402332911797, "rouge2_recall": 0.22030265368490773, "rouge2_recall_stderr": 0.0019596071325407617, "rougeL_fmeasure": 0.2877066533447448, "rougeL_fmeasure_stderr": 0.0015722869589788488, "rougeL_precision": 0.2682876782077045, "rougeL_precision_stderr": 0.0017434660077252258, "rougeL_recall": 0.3357310111978014, "rougeL_recall_stderr": 0.0021781101054053217, "rougeLsum_fmeasure": 0.34582724571038975, "rougeLsum_fmeasure_stderr": 0.0018153943190470448, "rougeLsum_precision": 0.32327624212453093, "rougeLsum_precision_stderr": 0.0020620269813736254, "rougeLsum_recall": 0.4015164129730794, "rougeLsum_recall_stderr": 0.0024008264881823175}}}, "gem_xsum": {"0": {"article_DOC_summary": {"bleu": 1.9895418658955089, "bleu_stderr": 0.058791202685981404, "rouge1_fmeasure": 0.21561062837939882, "rouge1_fmeasure_stderr": 0.0023994286403233862, "rouge1_precision": 0.15562575636638382, "rouge1_precision_stderr": 0.0018985685959581433, "rouge1_recall": 0.37071290923313827, "rouge1_recall_stderr": 0.00412806450314426, "rouge2_fmeasure": 0.04992047712716468, "rouge2_fmeasure_stderr": 0.0015659162879365486, "rouge2_precision": 0.035854646948925664, "rouge2_precision_stderr": 0.0011959015024675783, "rouge2_recall": 0.08777720514933714, "rouge2_recall_stderr": 0.0028093393672125244, "rougeL_fmeasure": 0.15823496005416243, "rougeL_fmeasure_stderr": 0.0018701288881012726, "rougeL_precision": 0.11410361066824068, "rougeL_precision_stderr": 0.0014883650475830462, "rougeL_recall": 0.27352828928489664, "rougeL_recall_stderr": 0.0033358267453375847, "rougeLsum_fmeasure": 0.17227583896279217, "rougeLsum_fmeasure_stderr": 0.0020612622488592977, "rougeLsum_precision": 0.12411547049969442, "rougeLsum_precision_stderr": 0.0016095217901991009, "rougeLsum_recall": 0.29756544693353426, "rougeLsum_recall_stderr": 0.0036531260756102256}}, "1": {"article_DOC_summary": {"bleu": 1.22504315109096, "bleu_stderr": 0.09308335353980157, "rouge1_fmeasure": 0.17500466633779274, "rouge1_fmeasure_stderr": 0.002369834619717104, "rouge1_precision": 0.12450251214516139, "rouge1_precision_stderr": 0.0017701644559474019, "rouge1_recall": 0.3066220711240498, "rouge1_recall_stderr": 0.004028698629097141, "rouge2_fmeasure": 0.03174368690811647, "rouge2_fmeasure_stderr": 0.0013089569557441355, "rouge2_precision": 0.022425235776437836, "rouge2_precision_stderr": 0.0009260101083179589, "rouge2_recall": 0.05660716486590679, "rouge2_recall_stderr": 0.0023949778530059774, "rougeL_fmeasure": 0.13160921880048357, "rougeL_fmeasure_stderr": 0.0017477071878516516, "rougeL_precision": 0.09339225179828282, "rougeL_precision_stderr": 0.0012872208930509489, "rougeL_recall": 0.23225364174357402, "rougeL_recall_stderr": 0.003121701045125992, "rougeLsum_fmeasure": 0.14248813343338157, "rougeLsum_fmeasure_stderr": 0.001971817720719966, "rougeLsum_precision": 0.10120518962461963, "rougeLsum_precision_stderr": 0.0014558021924337414, "rougeLsum_recall": 0.2508945472267905, "rougeLsum_recall_stderr": 0.0034731782884289226}}, "2": {"article_DOC_summary": {"bleu": 1.298794808823118, "bleu_stderr": 0.09705115916767015, "rouge1_fmeasure": 0.17365706390997016, "rouge1_fmeasure_stderr": 0.0023744297279891893, "rouge1_precision": 0.1234862615247332, "rouge1_precision_stderr": 0.001784653293189628, "rouge1_recall": 0.3044465438832426, "rouge1_recall_stderr": 0.003981514741893442, "rouge2_fmeasure": 0.03153224014629812, "rouge2_fmeasure_stderr": 0.00132441371576198, "rouge2_precision": 0.02226790525553246, "rouge2_precision_stderr": 0.000942452403285749, "rouge2_recall": 0.056422620727974965, "rouge2_recall_stderr": 0.0024200696931415224, "rougeL_fmeasure": 0.13213102627357046, "rougeL_fmeasure_stderr": 0.0017809957835749522, "rougeL_precision": 0.09368957768118093, "rougeL_precision_stderr": 0.0013169064303781464, "rougeL_recall": 0.23355487572465355, "rougeL_recall_stderr": 0.0031690210056585975, "rougeLsum_fmeasure": 0.14132095054221017, "rougeLsum_fmeasure_stderr": 0.0019853871709270238, "rougeLsum_precision": 0.10021625167450877, "rougeLsum_precision_stderr": 0.001468880768310731, "rougeLsum_recall": 0.24963190949674946, "rougeLsum_recall_stderr": 0.0034860586627063653}}, "3": {"article_DOC_summary": {"bleu": 1.3205278027479164, "bleu_stderr": 0.09561115002496487, "rouge1_fmeasure": 0.16354635610802612, "rouge1_fmeasure_stderr": 0.0024663949649927435, "rouge1_precision": 0.11844914382273448, "rouge1_precision_stderr": 0.0019201993243810158, "rouge1_recall": 0.28390135387162757, "rouge1_recall_stderr": 0.004220868188703738, "rouge2_fmeasure": 0.029556549223572853, "rouge2_fmeasure_stderr": 0.0012888784997271304, "rouge2_precision": 0.02107624492911234, "rouge2_precision_stderr": 0.000925135660801624, "rouge2_recall": 0.05264382125378585, "rouge2_recall_stderr": 0.0023516589207668815, "rougeL_fmeasure": 0.12619122655248322, "rougeL_fmeasure_stderr": 0.0018579466532603177, "rougeL_precision": 0.09104582658177605, "rougeL_precision_stderr": 0.0014168096722186306, "rougeL_recall": 0.22075959991016572, "rougeL_recall_stderr": 0.003328818909079906, "rougeLsum_fmeasure": 0.1324788344627292, "rougeLsum_fmeasure_stderr": 0.0020440661672023576, "rougeLsum_precision": 0.09565182333428005, "rougeLsum_precision_stderr": 0.001567884974278684, "rougeLsum_recall": 0.23135719936282417, "rougeLsum_recall_stderr": 0.0035958537292906803}}, "4": {"article_DOC_summary": {"bleu": 0.6426176499265798, "bleu_stderr": 0.10944172884159943, "rouge1_fmeasure": 0.046239903656618994, "rouge1_fmeasure_stderr": 0.002631695063266343, "rouge1_precision": 0.039205474045436915, "rouge1_precision_stderr": 0.0025102333275441356, "rouge1_recall": 0.07293349387654642, "rouge1_recall_stderr": 0.004216797737450448, "rouge2_fmeasure": 0.008394359766787172, "rouge2_fmeasure_stderr": 0.0008212624322810702, "rouge2_precision": 0.0065884676077519935, "rouge2_precision_stderr": 0.0006855012194927015, "rouge2_recall": 0.01391800911864852, "rouge2_recall_stderr": 0.0014107292938298562, "rougeL_fmeasure": 0.034807968155924324, "rougeL_fmeasure_stderr": 0.001962639728158149, "rougeL_precision": 0.030224247701060337, "rougeL_precision_stderr": 0.0020534035064510973, "rougeL_recall": 0.05511074735500151, "rougeL_recall_stderr": 0.0031931944384416162, "rougeLsum_fmeasure": 0.03760898789185391, "rougeLsum_fmeasure_stderr": 0.002134288615760715, "rougeLsum_precision": 0.03234508109476721, "rougeLsum_precision_stderr": 0.002152956064622564, "rougeLsum_recall": 0.059639154094017835, "rougeLsum_recall_stderr": 0.0034861307417076055}}, "5": {"article_DOC_summary": {"bleu": 5.88065686206085e-38, "bleu_stderr": 3.723633937038377e-32, "rouge1_fmeasure": 0.001882160171017921, "rouge1_fmeasure_stderr": 0.0005176393078664199, "rouge1_precision": 0.0021575243350025752, "rouge1_precision_stderr": 0.0006054243071962044, "rouge1_recall": 0.001704266236696643, "rouge1_recall_stderr": 0.0004652377643070007, "rouge2_fmeasure": 0.000263097920800064, "rouge2_fmeasure_stderr": 0.00010803201929354118, "rouge2_precision": 0.0003161470420071974, "rouge2_precision_stderr": 0.00012902342640180555, "rouge2_recall": 0.00022809737432378943, "rouge2_recall_stderr": 9.478510684431686e-05, "rougeL_fmeasure": 0.0014623646787355947, "rougeL_fmeasure_stderr": 0.00041204303295078344, "rougeL_precision": 0.0016748107867624196, "rougeL_precision_stderr": 0.0004791518665809304, "rougeL_recall": 0.00132498621769639, "rougeL_recall_stderr": 0.0003711043260363234, "rougeLsum_fmeasure": 0.0015022545826009262, "rougeLsum_fmeasure_stderr": 0.00042147455797712205, "rougeLsum_precision": 0.0017284128450814592, "rougeLsum_precision_stderr": 0.000493769341153888, "rougeLsum_recall": 0.0013567504004039692, "rougeLsum_recall_stderr": 0.0003777491879943449}}}} \ No newline at end of file diff --git a/4b284b6bc4seed2/evaluation/generation/slim.4b284b6bc4seed2_GEM-web_nlg_en_PALM_prompt_0.json b/4b284b6bc4seed2/evaluation/generation/slim.4b284b6bc4seed2_GEM-web_nlg_en_PALM_prompt_0.json new file mode 100644 index 0000000000000000000000000000000000000000..25c9ce99a139a5c1636ab2a0b9dfd2221980c5f0 --- /dev/null +++ b/4b284b6bc4seed2/evaluation/generation/slim.4b284b6bc4seed2_GEM-web_nlg_en_PALM_prompt_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.4505969912144358, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.043025981663977676 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.07715680688754782, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0018501494099723034 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.32800192332635164, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.004716290361046614 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.11475949399291512, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0020930584454703313 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.03691606942766564, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.001226252004533247 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.15714130080850514, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.003275285581951961 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.05421096419841178, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0013323602620276317 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.07330043188559601, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0016882205517441595 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.31747468696171116, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004607770796206798 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.1095828810892153, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0019205919592418358 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.07264308016772093, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.001734436368694926 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.30915040739896027, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004387887182362267 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.10804953744361874, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0019462325362491339 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b6bc4seed2/evaluation/generation/slim.4b284b6bc4seed2_GEM-web_nlg_en_PALM_prompt_1.json b/4b284b6bc4seed2/evaluation/generation/slim.4b284b6bc4seed2_GEM-web_nlg_en_PALM_prompt_1.json new file mode 100644 index 0000000000000000000000000000000000000000..6ff0e2583470e02473bb68ed6395a04da55d8116 --- /dev/null +++ b/4b284b6bc4seed2/evaluation/generation/slim.4b284b6bc4seed2_GEM-web_nlg_en_PALM_prompt_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.5248973715012223, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.04500340113008066 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.0790761668773179, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0016843496475256363 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.3697333749180133, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.005009866939283317 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.12116080004166574, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.002034248506156313 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.03678510490686299, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.001081873045114326 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.17843660776062029, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.003489215109878396 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.05647199175457009, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0013066532545353317 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.07404916365054973, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0015255606390290489 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.34923402691643046, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004687346760287558 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.11376961245179681, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0018264898168477456 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.07445381060380506, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.001593181333906948 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.3467160374634341, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004579407380382054 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.11395978695320426, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0018994693226140945 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b6bc4seed2/evaluation/generation/slim.4b284b6bc4seed2_GEM-web_nlg_en_PALM_prompt_2.json b/4b284b6bc4seed2/evaluation/generation/slim.4b284b6bc4seed2_GEM-web_nlg_en_PALM_prompt_2.json new file mode 100644 index 0000000000000000000000000000000000000000..2b50b5b3ffc13d67456f35e0a886e4592c97f9ce --- /dev/null +++ b/4b284b6bc4seed2/evaluation/generation/slim.4b284b6bc4seed2_GEM-web_nlg_en_PALM_prompt_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.5767647931281593, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.03075444324731624 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.08030107100423996, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0015674832760453747 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.38840421585850693, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.005175482568072094 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.12441199271565954, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.001979354566482751 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.037112804584329, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0009141020328534724 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.19070965082945687, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.003653414412934534 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.057979391263589294, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0012537328703996166 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.07384535953637529, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0013915854560762077 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.3595423504669609, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.00473567632900781 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.11464846086222981, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0017509905495136865 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.07564699950143948, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0014680313985962644 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.3655854110990312, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0047861725768252785 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.11714224514649191, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0018352989430204284 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b6bc4seed2/evaluation/generation/slim.4b284b6bc4seed2_GEM-web_nlg_en_PALM_prompt_3.json b/4b284b6bc4seed2/evaluation/generation/slim.4b284b6bc4seed2_GEM-web_nlg_en_PALM_prompt_3.json new file mode 100644 index 0000000000000000000000000000000000000000..f3fc77074d6ae9ed9ec85ca4d28319ffbfbe0994 --- /dev/null +++ b/4b284b6bc4seed2/evaluation/generation/slim.4b284b6bc4seed2_GEM-web_nlg_en_PALM_prompt_3.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.6551242086874565, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.03786184470041364 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.07882570317453028, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0015398380099203338 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.39347312457818545, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.005115592107070138 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.12253462963491722, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0019458379147742845 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.0365856093502546, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0009020386358581405 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.19448869036942362, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0036911175236007915 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.05738575356669148, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0012433710684840093 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.07184479663593357, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0013555990593936752 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.36011891059508755, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004569680331874904 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.11178706827138284, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0016888026831589167 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.07401320225138429, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.001446688093860126 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.3682561684373326, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004661037301261206 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.11492232075242285, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0018044818590991203 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 3, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b6bc4seed2/evaluation/generation/slim.4b284b6bc4seed2_GEM-web_nlg_en_PALM_prompt_4.json b/4b284b6bc4seed2/evaluation/generation/slim.4b284b6bc4seed2_GEM-web_nlg_en_PALM_prompt_4.json new file mode 100644 index 0000000000000000000000000000000000000000..0fc7cff81981b2a7908b967a039677d4c6ac68b9 --- /dev/null +++ b/4b284b6bc4seed2/evaluation/generation/slim.4b284b6bc4seed2_GEM-web_nlg_en_PALM_prompt_4.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.6361569019073665, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.048795806087287424 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.07936192579865504, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0015426897773666887 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.3967228621080476, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.005035788052603314 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.12333237651607433, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0018995495239739787 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.0361795830053176, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0008771942709925916 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.19495589680109515, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0036179457975666733 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.05685164611012959, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.001193840199959299 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.07239948675670523, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0013748540153599564 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.3637724702147103, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004528167648238907 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.11262522353373274, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.001668123718914031 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.07461562643114039, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0014456314194904961 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.3734381336992152, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004658729212112421 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.11594403375103957, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0017604845749238877 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 4, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b6bc4seed2/evaluation/generation/slim.4b284b6bc4seed2_GEM-web_nlg_en_PALM_prompt_5.json b/4b284b6bc4seed2/evaluation/generation/slim.4b284b6bc4seed2_GEM-web_nlg_en_PALM_prompt_5.json new file mode 100644 index 0000000000000000000000000000000000000000..26132c4a4baa673c2c1b099dc1380ac184b1d0ca --- /dev/null +++ b/4b284b6bc4seed2/evaluation/generation/slim.4b284b6bc4seed2_GEM-web_nlg_en_PALM_prompt_5.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.6348116381689767, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.025032005928245744 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.07772480241459157, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0014761937289481531 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.39775384294624816, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.005043126900140792 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.12151531670936837, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0018013952412054407 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.03642686374060602, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0010535500618274554 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.1954871545530622, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0036330438060616513 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.05654046753025775, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0011574259112533843 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.0708062283164349, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0013339231845929654 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.3620745179558994, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.00449776594486043 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.1106233752219019, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0016037607255517253 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.07304451504316123, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0013879168010522463 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.37251915128720225, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.00464816980850311 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.1140750876332385, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0016853800565220047 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 5, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b6bc4seed2/evaluation/generation/slim.4b284b6bc4seed2_GEM-wiki_lingua_en_tldr_en_0.json b/4b284b6bc4seed2/evaluation/generation/slim.4b284b6bc4seed2_GEM-wiki_lingua_en_tldr_en_0.json new file mode 100644 index 0000000000000000000000000000000000000000..7ff10e272a05b0981e76cc32e806734bf78c1ca0 --- /dev/null +++ b/4b284b6bc4seed2/evaluation/generation/slim.4b284b6bc4seed2_GEM-wiki_lingua_en_tldr_en_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.1603204965143781, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0019055374186705493 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.273148053641277, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.00271429826551829 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.18760609214914972, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0018528010283896678 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.03352653833860025, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0008141842668329252 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.059532665192850664, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.001495886372304702 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.039553536857052096, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0009080316883759782 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.11956609361350197, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.001288770553600895 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.21092821240171705, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.002145023872994803 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.14148134446020433, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.001278578656113803 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.1475742184322245, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.001744563798127783 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.25286325424170925, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0025434557707113424 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.17295948170907235, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0016989010001995553 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 1.7934141534025163, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.08383146848244837 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b6bc4seed2/evaluation/generation/slim.4b284b6bc4seed2_GEM-wiki_lingua_en_tldr_en_1.json b/4b284b6bc4seed2/evaluation/generation/slim.4b284b6bc4seed2_GEM-wiki_lingua_en_tldr_en_1.json new file mode 100644 index 0000000000000000000000000000000000000000..5c6f0846a956b0857716cd1935eac190c5942a8c --- /dev/null +++ b/4b284b6bc4seed2/evaluation/generation/slim.4b284b6bc4seed2_GEM-wiki_lingua_en_tldr_en_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.1745195547370322, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0020211127459286177 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.29756863851182014, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.002720442694533944 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.20404111705603262, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0018961046573895371 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.038836287518126324, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0008918673703720118 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.0678582672753382, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0015726696869910164 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.04531387019112246, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0009454489412507513 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.12403344533976053, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0013370363902071867 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.21966745113211172, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.002148471848315497 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.14662233559425056, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0012675330724451579 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.16262281802775871, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0018832504839498365 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.2785759841913255, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.002586017885803777 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.19031232879553658, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0017631603815569407 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 2.2027676863872756, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.07884539943019493 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b6bc4seed2/evaluation/generation/slim.4b284b6bc4seed2_GEM-wiki_lingua_en_tldr_en_2.json b/4b284b6bc4seed2/evaluation/generation/slim.4b284b6bc4seed2_GEM-wiki_lingua_en_tldr_en_2.json new file mode 100644 index 0000000000000000000000000000000000000000..e482253a1ac2513a756af2c2a5ae894043b46431 --- /dev/null +++ b/4b284b6bc4seed2/evaluation/generation/slim.4b284b6bc4seed2_GEM-wiki_lingua_en_tldr_en_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.17812583517946007, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.002009945937748485 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.303539848216664, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.002638500102412918 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.2078510077674295, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0018302477945332431 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.03988619638649071, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0008528640674491505 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.07069101771037783, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0015418058212234357 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.04667487755408923, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0009128949090939083 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.1260062676909843, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.001364424629646694 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.22269555369572, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.002089758754681962 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.14847289603046035, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0012287208530959888 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.16673210140327593, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.001876553104110706 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.28573976969483017, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.002520262824141778 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.1948747340586584, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0017076787007878865 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 2.3891366560914298, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.08062856329183088 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b6bc4seed2/evaluation/generation/slim.4b284b6bc4seed2_GEM-wiki_lingua_en_tldr_en_3.json b/4b284b6bc4seed2/evaluation/generation/slim.4b284b6bc4seed2_GEM-wiki_lingua_en_tldr_en_3.json new file mode 100644 index 0000000000000000000000000000000000000000..77fc84cb4cd249e9f497e5c3e4c5e51acdfc8310 --- /dev/null +++ b/4b284b6bc4seed2/evaluation/generation/slim.4b284b6bc4seed2_GEM-wiki_lingua_en_tldr_en_3.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.15466504916141774, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.002308226402178308 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.2551520537583065, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0032171951632609264 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.17428261104968168, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0021443814628730523 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.03492860218651495, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0009155361590863039 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.060501291725340245, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.001568003123293494 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.03952258753236028, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0009033133825001278 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.11061065008297513, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0016789233374586393 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.1885220916112058, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.002535325446834288 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.12499242197529943, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0014791492005730253 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.1453452296219742, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0021599240195076573 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.24088194688429895, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.00305926261571982 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.16396063897113883, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0020097929828463102 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 2.38911546645986, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.07647894828583013 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 3, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b6bc4seed2/evaluation/generation/slim.4b284b6bc4seed2_GEM-wiki_lingua_en_tldr_en_4.json b/4b284b6bc4seed2/evaluation/generation/slim.4b284b6bc4seed2_GEM-wiki_lingua_en_tldr_en_4.json new file mode 100644 index 0000000000000000000000000000000000000000..d6a7da4aaf79bd54d3918fc214c866889e9c9217 --- /dev/null +++ b/4b284b6bc4seed2/evaluation/generation/slim.4b284b6bc4seed2_GEM-wiki_lingua_en_tldr_en_4.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.053018296777332476, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.001989950046503427 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.08596667050742965, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.002947649719879261 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.056665547293806504, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.001891719846577204 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.011358703706930581, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.000600320864289757 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.021640340405918963, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0011802802866629615 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.013047921347416528, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0006398386351669672 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.03957496787938521, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0015124056846112217 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.06552651052204829, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0022922651246891222 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.04210570382315936, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.001378676251875729 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.049771628442206735, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0018700031303863793 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.08106940347167176, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0027897599646264986 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.05326532550449904, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0017732306920814024 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 0.5396555354382301, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.03382350846346006 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 4, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b6bc4seed2/evaluation/generation/slim.4b284b6bc4seed2_GEM-wiki_lingua_en_tldr_en_5.json b/4b284b6bc4seed2/evaluation/generation/slim.4b284b6bc4seed2_GEM-wiki_lingua_en_tldr_en_5.json new file mode 100644 index 0000000000000000000000000000000000000000..4a6798c66ed2800a181c300eacb912e94dfee430 --- /dev/null +++ b/4b284b6bc4seed2/evaluation/generation/slim.4b284b6bc4seed2_GEM-wiki_lingua_en_tldr_en_5.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.008477708430630778, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0008888303927431226 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.013378525794197375, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0013202915810629089 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.008692457481160468, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0008227750799750827 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.002035592041182627, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0003440486575723203 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.003334615800958582, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0004964329628462136 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.0020021672595433877, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0002655938544483011 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.006368490138883737, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0006824241585392732 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.010162399165178543, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0010265436936400937 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.006455452264291404, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0006047126016011451 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.007948184602390525, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0008399495471791939 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.012575544635440476, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0012445710338658724 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.008133155428782728, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0007677758628473678 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 6.626695028697088e-07, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 1.1951854876786307e-06 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 5, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b6bc4seed2/evaluation/generation/slim.4b284b6bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_0.json b/4b284b6bc4seed2/evaluation/generation/slim.4b284b6bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_0.json new file mode 100644 index 0000000000000000000000000000000000000000..042b7e72ce2b50b8218961d686c8511021dca662 --- /dev/null +++ b/4b284b6bc4seed2/evaluation/generation/slim.4b284b6bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 2.878712808592603, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.0853866064382545 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.12473936122211624, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.001798387415150618 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.21205919428582165, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.002854707525591281 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.14598569647435716, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.0019257642313717281 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.03495666955822184, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0008687034534547671 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.06654649371061956, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.0016084812198622184 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.04387542635560367, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0010442399588521244 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.11526993035626307, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.001545375812569594 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.19660657514045912, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.0025255577441268087 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.13483368037365023, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0016578290285278543 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.10944292922104659, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.0015541855309834716 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.1856831740193031, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.0025479048755850213 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.12774057149590898, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0016934965354593117 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b6bc4seed2/evaluation/generation/slim.4b284b6bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_1.json b/4b284b6bc4seed2/evaluation/generation/slim.4b284b6bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_1.json new file mode 100644 index 0000000000000000000000000000000000000000..5b222f71963be05b3df4ea95a030750b13797ea0 --- /dev/null +++ b/4b284b6bc4seed2/evaluation/generation/slim.4b284b6bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 9.756713461785154, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.1556457646527884 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.4098430493296336, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.002322243350403215 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.44204106174129115, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.002648076916437811 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.40687267868315097, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.0018487565527517862 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.17194753805951837, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0017305953745273977 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.18647781584399134, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.0018885402575458418 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.17029119687013236, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0015443604787036918 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.28268352481109116, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.0019277807551157933 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.30476888259625023, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.0021362292770155254 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.28000012009488995, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0015606595580042648 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.33736408060377443, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.002189042828443897 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.3634133186767332, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.0024561816405961946 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.3345777715915075, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.001819480989061025 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b6bc4seed2/evaluation/generation/slim.4b284b6bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_2.json b/4b284b6bc4seed2/evaluation/generation/slim.4b284b6bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_2.json new file mode 100644 index 0000000000000000000000000000000000000000..90819a6560f3af5cd10ca4149e560857e5ccc080 --- /dev/null +++ b/4b284b6bc4seed2/evaluation/generation/slim.4b284b6bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 9.703365784320074, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.16108986784891388 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.392092480268303, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.002302537065374289 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.4700929192938433, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.0025952785236860797 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.4101176075687606, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.0018267883175402378 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.17385266696101637, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0016739605455478718 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.21043725627335938, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.0019419833439951327 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.1817582009151592, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.001527895144436596 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.2694278866213945, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.0018257757886672125 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.32463760826780586, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.0021411692643784116 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.2819491223195203, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0015219411814398627 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.32676135279841206, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.002119047445904341 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.3923976496945184, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.002451591838805565 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.341970457946986, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0017909707229488067 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b6bc4seed2/evaluation/generation/slim.4b284b6bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_3.json b/4b284b6bc4seed2/evaluation/generation/slim.4b284b6bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_3.json new file mode 100644 index 0000000000000000000000000000000000000000..69de98d7a67a719a8cb91535391b8681893ac5ad --- /dev/null +++ b/4b284b6bc4seed2/evaluation/generation/slim.4b284b6bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_3.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 9.761234651073966, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.08117964062807032 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.3769467510554381, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.00213141802058671 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.4783045642626352, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.0025707591897062483 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.4065423629912447, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.001806841436683923 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.16918099441968293, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0015053602189487548 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.21947419317279818, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.002013053097487535 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.18366190818796568, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0015116466616384265 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.2607744983983079, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.0016830752871787188 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.3333300743221725, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.0021979974365264774 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.2817551356956864, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0015262712862237756 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.31727007213590536, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.001993439598512182 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.40307149877627624, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.002469750781351579 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.34229547153938067, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.001786413003034628 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 3, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b6bc4seed2/evaluation/generation/slim.4b284b6bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_4.json b/4b284b6bc4seed2/evaluation/generation/slim.4b284b6bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_4.json new file mode 100644 index 0000000000000000000000000000000000000000..ceaec7d9e442cdef8f141de5ce279a7778d5f3d5 --- /dev/null +++ b/4b284b6bc4seed2/evaluation/generation/slim.4b284b6bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_4.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 10.060481335729593, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.13006673690205298 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.3804171250877555, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.0021190302719114127 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.4780703069260566, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.002533824939435917 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.40925099639651336, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.0018052362806663203 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.17221168629234665, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0015253603947935756 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.2208989636456487, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.0020171225023131564 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.1863731784770829, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0015333517641007584 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.26364753406030395, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.001681924883574724 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.3339558499615528, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.0022103390891101316 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.28431779718263517, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0015550810673653737 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.32014456374564415, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.001994286539846333 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.40252942143619874, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.0024450797012346218 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.3444533365407922, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0018019008736801165 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 4, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b6bc4seed2/evaluation/generation/slim.4b284b6bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_5.json b/4b284b6bc4seed2/evaluation/generation/slim.4b284b6bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_5.json new file mode 100644 index 0000000000000000000000000000000000000000..c7115b06f465967e0b783f6f93777b1629bad7ee --- /dev/null +++ b/4b284b6bc4seed2/evaluation/generation/slim.4b284b6bc4seed2_e2e_nlg_cleaned_generate_text_restaurant_5.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 10.242478339458849, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.15925298363618348 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.3847914899421603, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.002183175369376523 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.4774457234022992, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.002464818162721772 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.411488509635484, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.0018020990796425748 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.17466204582352918, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0015530402332911797 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.22030265368490773, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.0019596071325407617 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.18753065960202087, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0015196039524377218 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.2682876782077045, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.0017434660077252258 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.3357310111978014, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.0021781101054053217 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.2877066533447448, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0015722869589788488 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.32327624212453093, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.0020620269813736254 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.4015164129730794, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.0024008264881823175 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.34582724571038975, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0018153943190470448 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 5, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b6bc4seed2/evaluation/generation/slim.4b284b6bc4seed2_gem_xsum_article_DOC_summary_0.json b/4b284b6bc4seed2/evaluation/generation/slim.4b284b6bc4seed2_gem_xsum_article_DOC_summary_0.json new file mode 100644 index 0000000000000000000000000000000000000000..84fe6a8dd82c0350de8b7dd7693c2514b8f2ad97 --- /dev/null +++ b/4b284b6bc4seed2/evaluation/generation/slim.4b284b6bc4seed2_gem_xsum_article_DOC_summary_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.15562575636638382, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.0018985685959581433 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.37071290923313827, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.00412806450314426 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.21561062837939882, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.0023994286403233862 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.035854646948925664, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0011959015024675783 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.08777720514933714, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.0028093393672125244 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.04992047712716468, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0015659162879365486 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.11410361066824068, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0014883650475830462 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.27352828928489664, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.0033358267453375847 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.15823496005416243, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0018701288881012726 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.12411547049969442, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0016095217901991009 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.29756544693353426, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.0036531260756102256 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.17227583896279217, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0020612622488592977 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 1.9895418658955089, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.058791202685981404 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b6bc4seed2/evaluation/generation/slim.4b284b6bc4seed2_gem_xsum_article_DOC_summary_1.json b/4b284b6bc4seed2/evaluation/generation/slim.4b284b6bc4seed2_gem_xsum_article_DOC_summary_1.json new file mode 100644 index 0000000000000000000000000000000000000000..3fc9bb3aa75cf0a92e2e1d7dae87d6fbbffd9447 --- /dev/null +++ b/4b284b6bc4seed2/evaluation/generation/slim.4b284b6bc4seed2_gem_xsum_article_DOC_summary_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.12450251214516139, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.0017701644559474019 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.3066220711240498, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.004028698629097141 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.17500466633779274, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.002369834619717104 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.022425235776437836, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0009260101083179589 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.05660716486590679, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.0023949778530059774 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.03174368690811647, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0013089569557441355 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.09339225179828282, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0012872208930509489 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.23225364174357402, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.003121701045125992 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.13160921880048357, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0017477071878516516 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.10120518962461963, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0014558021924337414 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.2508945472267905, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.0034731782884289226 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.14248813343338157, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.001971817720719966 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 1.22504315109096, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.09308335353980157 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b6bc4seed2/evaluation/generation/slim.4b284b6bc4seed2_gem_xsum_article_DOC_summary_2.json b/4b284b6bc4seed2/evaluation/generation/slim.4b284b6bc4seed2_gem_xsum_article_DOC_summary_2.json new file mode 100644 index 0000000000000000000000000000000000000000..2ff152d1e6d49df7deec401362328442b588268a --- /dev/null +++ b/4b284b6bc4seed2/evaluation/generation/slim.4b284b6bc4seed2_gem_xsum_article_DOC_summary_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.1234862615247332, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.001784653293189628 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.3044465438832426, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.003981514741893442 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.17365706390997016, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.0023744297279891893 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.02226790525553246, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.000942452403285749 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.056422620727974965, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.0024200696931415224 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.03153224014629812, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.00132441371576198 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.09368957768118093, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0013169064303781464 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.23355487572465355, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.0031690210056585975 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.13213102627357046, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0017809957835749522 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.10021625167450877, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.001468880768310731 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.24963190949674946, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.0034860586627063653 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.14132095054221017, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0019853871709270238 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 1.298794808823118, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.09705115916767015 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b6bc4seed2/evaluation/generation/slim.4b284b6bc4seed2_gem_xsum_article_DOC_summary_3.json b/4b284b6bc4seed2/evaluation/generation/slim.4b284b6bc4seed2_gem_xsum_article_DOC_summary_3.json new file mode 100644 index 0000000000000000000000000000000000000000..2a9ce43418e6961576427e2c0417d173e1aba79c --- /dev/null +++ b/4b284b6bc4seed2/evaluation/generation/slim.4b284b6bc4seed2_gem_xsum_article_DOC_summary_3.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.11844914382273448, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.0019201993243810158 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.28390135387162757, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.004220868188703738 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.16354635610802612, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.0024663949649927435 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.02107624492911234, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.000925135660801624 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.05264382125378585, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.0023516589207668815 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.029556549223572853, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0012888784997271304 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.09104582658177605, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0014168096722186306 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.22075959991016572, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.003328818909079906 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.12619122655248322, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0018579466532603177 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.09565182333428005, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.001567884974278684 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.23135719936282417, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.0035958537292906803 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.1324788344627292, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0020440661672023576 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 1.3205278027479164, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.09561115002496487 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 3, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b6bc4seed2/evaluation/generation/slim.4b284b6bc4seed2_gem_xsum_article_DOC_summary_4.json b/4b284b6bc4seed2/evaluation/generation/slim.4b284b6bc4seed2_gem_xsum_article_DOC_summary_4.json new file mode 100644 index 0000000000000000000000000000000000000000..9a03539ecc5cb3d600b6812249cf966f08904cba --- /dev/null +++ b/4b284b6bc4seed2/evaluation/generation/slim.4b284b6bc4seed2_gem_xsum_article_DOC_summary_4.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.039205474045436915, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.0025102333275441356 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.07293349387654642, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.004216797737450448 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.046239903656618994, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.002631695063266343 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.0065884676077519935, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0006855012194927015 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.01391800911864852, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.0014107292938298562 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.008394359766787172, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0008212624322810702 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.030224247701060337, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0020534035064510973 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.05511074735500151, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.0031931944384416162 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.034807968155924324, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.001962639728158149 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.03234508109476721, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.002152956064622564 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.059639154094017835, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.0034861307417076055 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.03760898789185391, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.002134288615760715 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 0.6426176499265798, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.10944172884159943 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 4, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b6bc4seed2/evaluation/generation/slim.4b284b6bc4seed2_gem_xsum_article_DOC_summary_5.json b/4b284b6bc4seed2/evaluation/generation/slim.4b284b6bc4seed2_gem_xsum_article_DOC_summary_5.json new file mode 100644 index 0000000000000000000000000000000000000000..7f90868bb6d2c0e42780a9d1d433aa72c06652d7 --- /dev/null +++ b/4b284b6bc4seed2/evaluation/generation/slim.4b284b6bc4seed2_gem_xsum_article_DOC_summary_5.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.0021575243350025752, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.0006054243071962044 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.001704266236696643, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.0004652377643070007 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.001882160171017921, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.0005176393078664199 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.0003161470420071974, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.00012902342640180555 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.00022809737432378943, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 9.478510684431686e-05 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.000263097920800064, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.00010803201929354118 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.0016748107867624196, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0004791518665809304 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.00132498621769639, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.0003711043260363234 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.0014623646787355947, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.00041204303295078344 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.0017284128450814592, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.000493769341153888 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.0013567504004039692, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.0003777491879943449 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.0015022545826009262, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.00042147455797712205 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 5.88065686206085e-38, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 3.723633937038377e-32 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed2/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 5, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b6bc4seed2/evaluation/rankeval/4b284b6bc4seed2_0.csv b/4b284b6bc4seed2/evaluation/rankeval/4b284b6bc4seed2_0.csv new file mode 100644 index 0000000000000000000000000000000000000000..6599ae83c72857ecfd2fcec2b6562a4e8257d3aa --- /dev/null +++ b/4b284b6bc4seed2/evaluation/rankeval/4b284b6bc4seed2_0.csv @@ -0,0 +1,21 @@ +task,metric,value,err,version +anli_r1,acc,0.339,0.014976758771620344,0 +anli_r2,acc,0.332,0.01489959724281148,0 +anli_r3,acc,0.35,0.013774667009018554,0 +arc_challenge,acc,0.2593856655290102,0.01280827357392711,0 +arc_challenge,acc_norm,0.29180887372013653,0.013284525292403508,0 +arc_easy,acc,0.5715488215488216,0.010154195733990958,0 +arc_easy,acc_norm,0.5138888888888888,0.010255824507190347,0 +boolq,acc,0.590519877675841,0.008600549751320912,1 +cb,acc,0.4107142857142857,0.06633634150359541,1 +cb,f1,0.3433862433862434,,1 +copa,acc,0.77,0.04229525846816506,0 +hellaswag,acc,0.4585739892451703,0.004972625848702654,0 +hellaswag,acc_norm,0.599681338378809,0.004889615413144211,0 +piqa,acc,0.7372143634385201,0.010269354068140767,0 +piqa,acc_norm,0.7486398258977149,0.010121156016819252,0 +rte,acc,0.5631768953068592,0.02985524739031495,0 +sciq,acc,0.805,0.012535235623319324,0 +sciq,acc_norm,0.72,0.014205696104091505,0 +storycloze_2016,acc,0.7087119187600214,0.010506919924163607,0 +winogrande,acc,0.5619573796369376,0.013944181296470804,0 diff --git a/4b284b6bc4seed2/evaluation/rankeval/4b284b6bc4seed2_0.json b/4b284b6bc4seed2/evaluation/rankeval/4b284b6bc4seed2_0.json new file mode 100644 index 0000000000000000000000000000000000000000..a74e6a5b98a1411481b24e8dc07ab099fe3d38c6 --- /dev/null +++ b/4b284b6bc4seed2/evaluation/rankeval/4b284b6bc4seed2_0.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.339, + "acc_stderr": 0.014976758771620344 + }, + "anli_r2": { + "acc": 0.332, + "acc_stderr": 0.01489959724281148 + }, + "anli_r3": { + "acc": 0.35, + "acc_stderr": 0.013774667009018554 + }, + "cb": { + "acc": 0.4107142857142857, + "acc_stderr": 0.06633634150359541, + "f1": 0.3433862433862434 + }, + "copa": { + "acc": 0.77, + "acc_stderr": 0.04229525846816506 + }, + "hellaswag": { + "acc": 0.4585739892451703, + "acc_stderr": 0.004972625848702654, + "acc_norm": 0.599681338378809, + "acc_norm_stderr": 0.004889615413144211 + }, + "rte": { + "acc": 0.5631768953068592, + "acc_stderr": 0.02985524739031495 + }, + "winogrande": { + "acc": 0.5619573796369376, + "acc_stderr": 0.013944181296470804 + }, + "storycloze_2016": { + "acc": 0.7087119187600214, + "acc_stderr": 0.010506919924163607 + }, + "boolq": { + "acc": 0.590519877675841, + "acc_stderr": 0.008600549751320912 + }, + "arc_easy": { + "acc": 0.5715488215488216, + "acc_stderr": 0.010154195733990958, + "acc_norm": 0.5138888888888888, + "acc_norm_stderr": 0.010255824507190347 + }, + "arc_challenge": { + "acc": 0.2593856655290102, + "acc_stderr": 0.01280827357392711, + "acc_norm": 0.29180887372013653, + "acc_norm_stderr": 0.013284525292403508 + }, + "sciq": { + "acc": 0.805, + "acc_stderr": 0.012535235623319324, + "acc_norm": 0.72, + "acc_norm_stderr": 0.014205696104091505 + }, + "piqa": { + "acc": 0.7372143634385201, + "acc_stderr": 0.010269354068140767, + "acc_norm": 0.7486398258977149, + "acc_norm_stderr": 0.010121156016819252 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b6bc4seed2/evaluation/rankeval/4b284b6bc4seed2_1.csv b/4b284b6bc4seed2/evaluation/rankeval/4b284b6bc4seed2_1.csv new file mode 100644 index 0000000000000000000000000000000000000000..fd3cd42591ba8ee4e3c2e1f2e990a72ce4941c26 --- /dev/null +++ b/4b284b6bc4seed2/evaluation/rankeval/4b284b6bc4seed2_1.csv @@ -0,0 +1,21 @@ +task,metric,value,err,version +anli_r1,acc,0.342,0.01500870618212173,0 +anli_r2,acc,0.312,0.014658474370509012,0 +anli_r3,acc,0.3358333333333333,0.013639261190932884,0 +arc_challenge,acc,0.2764505119453925,0.013069662474252428,0 +arc_challenge,acc_norm,0.29180887372013653,0.013284525292403508,0 +arc_easy,acc,0.5749158249158249,0.010143966195717849,0 +arc_easy,acc_norm,0.5378787878787878,0.01023029962886481,0 +boolq,acc,0.5886850152905199,0.008606395426309213,1 +cb,acc,0.44642857142857145,0.067031892279424,1 +cb,f1,0.3282216841538876,,1 +copa,acc,0.78,0.04163331998932261,0 +hellaswag,acc,0.46036646086436966,0.004974080638364265,0 +hellaswag,acc_norm,0.5976897032463653,0.004893617014975305,0 +piqa,acc,0.7448313384113167,0.01017157159252182,0 +piqa,acc_norm,0.7557127312295974,0.01002476517228425,0 +rte,acc,0.516245487364621,0.030080573208738064,0 +sciq,acc,0.851,0.011266140684632176,0 +sciq,acc_norm,0.823,0.012075463420375061,0 +storycloze_2016,acc,0.703901656867985,0.01055730768847513,0 +winogrande,acc,0.5619573796369376,0.013944181296470803,0 diff --git a/4b284b6bc4seed2/evaluation/rankeval/4b284b6bc4seed2_1.json b/4b284b6bc4seed2/evaluation/rankeval/4b284b6bc4seed2_1.json new file mode 100644 index 0000000000000000000000000000000000000000..cb7f2c7eaac1ec68769b95e862696737dd88fe09 --- /dev/null +++ b/4b284b6bc4seed2/evaluation/rankeval/4b284b6bc4seed2_1.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.342, + "acc_stderr": 0.01500870618212173 + }, + "anli_r2": { + "acc": 0.312, + "acc_stderr": 0.014658474370509012 + }, + "anli_r3": { + "acc": 0.3358333333333333, + "acc_stderr": 0.013639261190932884 + }, + "cb": { + "acc": 0.44642857142857145, + "acc_stderr": 0.067031892279424, + "f1": 0.3282216841538876 + }, + "copa": { + "acc": 0.78, + "acc_stderr": 0.04163331998932261 + }, + "hellaswag": { + "acc": 0.46036646086436966, + "acc_stderr": 0.004974080638364265, + "acc_norm": 0.5976897032463653, + "acc_norm_stderr": 0.004893617014975305 + }, + "rte": { + "acc": 0.516245487364621, + "acc_stderr": 0.030080573208738064 + }, + "winogrande": { + "acc": 0.5619573796369376, + "acc_stderr": 0.013944181296470803 + }, + "storycloze_2016": { + "acc": 0.703901656867985, + "acc_stderr": 0.01055730768847513 + }, + "boolq": { + "acc": 0.5886850152905199, + "acc_stderr": 0.008606395426309213 + }, + "arc_easy": { + "acc": 0.5749158249158249, + "acc_stderr": 0.010143966195717849, + "acc_norm": 0.5378787878787878, + "acc_norm_stderr": 0.01023029962886481 + }, + "arc_challenge": { + "acc": 0.2764505119453925, + "acc_stderr": 0.013069662474252428, + "acc_norm": 0.29180887372013653, + "acc_norm_stderr": 0.013284525292403508 + }, + "sciq": { + "acc": 0.851, + "acc_stderr": 0.011266140684632176, + "acc_norm": 0.823, + "acc_norm_stderr": 0.012075463420375061 + }, + "piqa": { + "acc": 0.7448313384113167, + "acc_stderr": 0.01017157159252182, + "acc_norm": 0.7557127312295974, + "acc_norm_stderr": 0.01002476517228425 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b6bc4seed2/evaluation/rankeval/4b284b6bc4seed2_2.csv b/4b284b6bc4seed2/evaluation/rankeval/4b284b6bc4seed2_2.csv new file mode 100644 index 0000000000000000000000000000000000000000..a385664e71e465da072d0e5de8f2b51813ba6f3f --- /dev/null +++ b/4b284b6bc4seed2/evaluation/rankeval/4b284b6bc4seed2_2.csv @@ -0,0 +1,21 @@ +task,metric,value,err,version +anli_r1,acc,0.337,0.01495508791865361,0 +anli_r2,acc,0.346,0.01505026612756444,0 +anli_r3,acc,0.3383333333333333,0.013664144006618271,0 +arc_challenge,acc,0.2687713310580205,0.01295506596371069,0 +arc_challenge,acc_norm,0.3054607508532423,0.013460080478002503,0 +arc_easy,acc,0.5904882154882155,0.010090368160990059,0 +arc_easy,acc_norm,0.5585016835016835,0.01018931438274992,0 +boolq,acc,0.5944954128440367,0.008587459055441612,1 +cb,acc,0.42857142857142855,0.06672848092813058,1 +cb,f1,0.29690346083788705,,1 +copa,acc,0.76,0.042923469599092816,0 +hellaswag,acc,0.45807608046205933,0.004972210244020576,0 +hellaswag,acc_norm,0.6032662816172077,0.004882200364432357,0 +piqa,acc,0.7442872687704026,0.010178690109459858,0 +piqa,acc_norm,0.7426550598476604,0.010199921064792509,0 +rte,acc,0.4404332129963899,0.02988212336311872,0 +sciq,acc,0.879,0.010318210380946088,0 +sciq,acc_norm,0.846,0.011419913065098692,0 +storycloze_2016,acc,0.6990913949759487,0.010606289538707346,0 +winogrande,acc,0.5674822415153907,0.013923911578623833,0 diff --git a/4b284b6bc4seed2/evaluation/rankeval/4b284b6bc4seed2_2.json b/4b284b6bc4seed2/evaluation/rankeval/4b284b6bc4seed2_2.json new file mode 100644 index 0000000000000000000000000000000000000000..eb755fa322b4e6058426fe5d5e9e7d847aa29556 --- /dev/null +++ b/4b284b6bc4seed2/evaluation/rankeval/4b284b6bc4seed2_2.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.337, + "acc_stderr": 0.01495508791865361 + }, + "anli_r2": { + "acc": 0.346, + "acc_stderr": 0.01505026612756444 + }, + "anli_r3": { + "acc": 0.3383333333333333, + "acc_stderr": 0.013664144006618271 + }, + "cb": { + "acc": 0.42857142857142855, + "acc_stderr": 0.06672848092813058, + "f1": 0.29690346083788705 + }, + "copa": { + "acc": 0.76, + "acc_stderr": 0.042923469599092816 + }, + "hellaswag": { + "acc": 0.45807608046205933, + "acc_stderr": 0.004972210244020576, + "acc_norm": 0.6032662816172077, + "acc_norm_stderr": 0.004882200364432357 + }, + "rte": { + "acc": 0.4404332129963899, + "acc_stderr": 0.02988212336311872 + }, + "winogrande": { + "acc": 0.5674822415153907, + "acc_stderr": 0.013923911578623833 + }, + "storycloze_2016": { + "acc": 0.6990913949759487, + "acc_stderr": 0.010606289538707346 + }, + "boolq": { + "acc": 0.5944954128440367, + "acc_stderr": 0.008587459055441612 + }, + "arc_easy": { + "acc": 0.5904882154882155, + "acc_stderr": 0.010090368160990059, + "acc_norm": 0.5585016835016835, + "acc_norm_stderr": 0.01018931438274992 + }, + "arc_challenge": { + "acc": 0.2687713310580205, + "acc_stderr": 0.01295506596371069, + "acc_norm": 0.3054607508532423, + "acc_norm_stderr": 0.013460080478002503 + }, + "sciq": { + "acc": 0.879, + "acc_stderr": 0.010318210380946088, + "acc_norm": 0.846, + "acc_norm_stderr": 0.011419913065098692 + }, + "piqa": { + "acc": 0.7442872687704026, + "acc_stderr": 0.010178690109459858, + "acc_norm": 0.7426550598476604, + "acc_norm_stderr": 0.010199921064792509 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b6bc4seed2/evaluation/rankeval/4b284b6bc4seed2_3.csv b/4b284b6bc4seed2/evaluation/rankeval/4b284b6bc4seed2_3.csv new file mode 100644 index 0000000000000000000000000000000000000000..501ab2f8f09c62d8fee3aabb5a410c1958520219 --- /dev/null +++ b/4b284b6bc4seed2/evaluation/rankeval/4b284b6bc4seed2_3.csv @@ -0,0 +1,21 @@ +task,metric,value,err,version +anli_r1,acc,0.339,0.014976758771620344,0 +anli_r2,acc,0.357,0.01515852172148677,0 +anli_r3,acc,0.3383333333333333,0.013664144006618268,0 +arc_challenge,acc,0.27986348122866894,0.013119040897725922,0 +arc_challenge,acc_norm,0.30119453924914674,0.013406741767847626,0 +arc_easy,acc,0.5879629629629629,0.01009976585756276,0 +arc_easy,acc_norm,0.5606060606060606,0.010184134315437663,0 +boolq,acc,0.6039755351681957,0.00855388133681342,1 +cb,acc,0.48214285714285715,0.0673769750864465,1 +cb,f1,0.3707141840944658,,1 +copa,acc,0.79,0.040936018074033256,0 +hellaswag,acc,0.46036646086436966,0.0049740806383642665,0 +hellaswag,acc_norm,0.6047600079665405,0.004879030010598914,0 +piqa,acc,0.7486398258977149,0.01012115601681926,0 +piqa,acc_norm,0.7475516866158868,0.010135665547362355,0 +rte,acc,0.5126353790613718,0.030086851767188564,0 +sciq,acc,0.873,0.010534798620855752,0 +sciq,acc_norm,0.851,0.011266140684632163,0 +storycloze_2016,acc,0.7060395510422234,0.010535087882304173,0 +winogrande,acc,0.5698500394632992,0.013914685094716701,0 diff --git a/4b284b6bc4seed2/evaluation/rankeval/4b284b6bc4seed2_3.json b/4b284b6bc4seed2/evaluation/rankeval/4b284b6bc4seed2_3.json new file mode 100644 index 0000000000000000000000000000000000000000..f9f7978e5ce57ecd7257720f4a5041206b0aff48 --- /dev/null +++ b/4b284b6bc4seed2/evaluation/rankeval/4b284b6bc4seed2_3.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.339, + "acc_stderr": 0.014976758771620344 + }, + "anli_r2": { + "acc": 0.357, + "acc_stderr": 0.01515852172148677 + }, + "anli_r3": { + "acc": 0.3383333333333333, + "acc_stderr": 0.013664144006618268 + }, + "cb": { + "acc": 0.48214285714285715, + "acc_stderr": 0.0673769750864465, + "f1": 0.3707141840944658 + }, + "copa": { + "acc": 0.79, + "acc_stderr": 0.040936018074033256 + }, + "hellaswag": { + "acc": 0.46036646086436966, + "acc_stderr": 0.0049740806383642665, + "acc_norm": 0.6047600079665405, + "acc_norm_stderr": 0.004879030010598914 + }, + "rte": { + "acc": 0.5126353790613718, + "acc_stderr": 0.030086851767188564 + }, + "winogrande": { + "acc": 0.5698500394632992, + "acc_stderr": 0.013914685094716701 + }, + "storycloze_2016": { + "acc": 0.7060395510422234, + "acc_stderr": 0.010535087882304173 + }, + "boolq": { + "acc": 0.6039755351681957, + "acc_stderr": 0.00855388133681342 + }, + "arc_easy": { + "acc": 0.5879629629629629, + "acc_stderr": 0.01009976585756276, + "acc_norm": 0.5606060606060606, + "acc_norm_stderr": 0.010184134315437663 + }, + "arc_challenge": { + "acc": 0.27986348122866894, + "acc_stderr": 0.013119040897725922, + "acc_norm": 0.30119453924914674, + "acc_norm_stderr": 0.013406741767847626 + }, + "sciq": { + "acc": 0.873, + "acc_stderr": 0.010534798620855752, + "acc_norm": 0.851, + "acc_norm_stderr": 0.011266140684632163 + }, + "piqa": { + "acc": 0.7486398258977149, + "acc_stderr": 0.01012115601681926, + "acc_norm": 0.7475516866158868, + "acc_norm_stderr": 0.010135665547362355 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b6bc4seed2/evaluation/rankeval/4b284b6bc4seed2_4.csv b/4b284b6bc4seed2/evaluation/rankeval/4b284b6bc4seed2_4.csv new file mode 100644 index 0000000000000000000000000000000000000000..7ecf5ad83b8fc392a02b96c05f302fab62e032e7 --- /dev/null +++ b/4b284b6bc4seed2/evaluation/rankeval/4b284b6bc4seed2_4.csv @@ -0,0 +1,21 @@ +task,metric,value,err,version +anli_r1,acc,0.352,0.015110404505648661,0 +anli_r2,acc,0.345,0.015039986742055237,0 +anli_r3,acc,0.33666666666666667,0.013647602942406386,0 +arc_challenge,acc,0.27559726962457337,0.013057169655761836,0 +arc_challenge,acc_norm,0.3097269624573379,0.01351205841523836,0 +arc_easy,acc,0.5829124579124579,0.010117738967781995,0 +arc_easy,acc_norm,0.5681818181818182,0.010163945352271733,0 +boolq,acc,0.6024464831804281,0.008559523256936817,1 +cb,acc,0.42857142857142855,0.06672848092813058,1 +cb,f1,0.2523868825238688,,1 +copa,acc,0.79,0.040936018074033256,0 +hellaswag,acc,0.46046604262099183,0.0049741595613426995,0 +hellaswag,acc_norm,0.6078470424218283,0.004872326888655508,0 +piqa,acc,0.7437431991294886,0.01018578783156507,0 +piqa,acc_norm,0.7453754080522307,0.010164432237060499,0 +rte,acc,0.4729241877256318,0.030052303463143713,0 +sciq,acc,0.874,0.010499249222408037,0 +sciq,acc_norm,0.861,0.010945263761042974,0 +storycloze_2016,acc,0.7167290219134153,0.010419760409155363,0 +winogrande,acc,0.5808997632202052,0.01386732519221012,0 diff --git a/4b284b6bc4seed2/evaluation/rankeval/4b284b6bc4seed2_4.json b/4b284b6bc4seed2/evaluation/rankeval/4b284b6bc4seed2_4.json new file mode 100644 index 0000000000000000000000000000000000000000..43f0ddab460282ff7477413fbee6c9c0ea95baf7 --- /dev/null +++ b/4b284b6bc4seed2/evaluation/rankeval/4b284b6bc4seed2_4.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.352, + "acc_stderr": 0.015110404505648661 + }, + "anli_r2": { + "acc": 0.345, + "acc_stderr": 0.015039986742055237 + }, + "anli_r3": { + "acc": 0.33666666666666667, + "acc_stderr": 0.013647602942406386 + }, + "cb": { + "acc": 0.42857142857142855, + "acc_stderr": 0.06672848092813058, + "f1": 0.2523868825238688 + }, + "copa": { + "acc": 0.79, + "acc_stderr": 0.040936018074033256 + }, + "hellaswag": { + "acc": 0.46046604262099183, + "acc_stderr": 0.0049741595613426995, + "acc_norm": 0.6078470424218283, + "acc_norm_stderr": 0.004872326888655508 + }, + "rte": { + "acc": 0.4729241877256318, + "acc_stderr": 0.030052303463143713 + }, + "winogrande": { + "acc": 0.5808997632202052, + "acc_stderr": 0.01386732519221012 + }, + "storycloze_2016": { + "acc": 0.7167290219134153, + "acc_stderr": 0.010419760409155363 + }, + "boolq": { + "acc": 0.6024464831804281, + "acc_stderr": 0.008559523256936817 + }, + "arc_easy": { + "acc": 0.5829124579124579, + "acc_stderr": 0.010117738967781995, + "acc_norm": 0.5681818181818182, + "acc_norm_stderr": 0.010163945352271733 + }, + "arc_challenge": { + "acc": 0.27559726962457337, + "acc_stderr": 0.013057169655761836, + "acc_norm": 0.3097269624573379, + "acc_norm_stderr": 0.01351205841523836 + }, + "sciq": { + "acc": 0.874, + "acc_stderr": 0.010499249222408037, + "acc_norm": 0.861, + "acc_norm_stderr": 0.010945263761042974 + }, + "piqa": { + "acc": 0.7437431991294886, + "acc_stderr": 0.01018578783156507, + "acc_norm": 0.7453754080522307, + "acc_norm_stderr": 0.010164432237060499 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b6bc4seed2/evaluation/rankeval/4b284b6bc4seed2_5.csv b/4b284b6bc4seed2/evaluation/rankeval/4b284b6bc4seed2_5.csv new file mode 100644 index 0000000000000000000000000000000000000000..70b1c4b9a5bf6a4e53ddcfeea90038adf78cffe1 --- /dev/null +++ b/4b284b6bc4seed2/evaluation/rankeval/4b284b6bc4seed2_5.csv @@ -0,0 +1,21 @@ +task,metric,value,err,version +anli_r1,acc,0.35,0.015090650341444233,0 +anli_r2,acc,0.326,0.01483050720454105,0 +anli_r3,acc,0.3408333333333333,0.013688600793296939,0 +arc_challenge,acc,0.2832764505119454,0.013167478735134576,0 +arc_challenge,acc_norm,0.29948805460750855,0.013385021637313569,0 +arc_easy,acc,0.5854377104377104,0.010108889212447777,0 +arc_easy,acc_norm,0.5660774410774411,0.010169795770462101,0 +boolq,acc,0.6085626911314985,0.008536430524403955,1 +cb,acc,0.4642857142857143,0.0672477765493766,1 +cb,f1,0.23666371942234013,,1 +copa,acc,0.76,0.042923469599092816,0 +hellaswag,acc,0.46086436964748057,0.004974473255391268,0 +hellaswag,acc_norm,0.6085441147181836,0.004870785036708273,0 +piqa,acc,0.7377584330794341,0.01026250256517245,0 +piqa,acc_norm,0.750272034820457,0.010099232969867476,0 +rte,acc,0.49097472924187724,0.030091559826331334,0 +sciq,acc,0.878,0.010354864712936705,0 +sciq,acc_norm,0.871,0.01060525678479658,0 +storycloze_2016,acc,0.7188669160876536,0.010395836091628122,0 +winogrande,acc,0.5666929755327546,0.013926915052757347,0 diff --git a/4b284b6bc4seed2/evaluation/rankeval/4b284b6bc4seed2_5.json b/4b284b6bc4seed2/evaluation/rankeval/4b284b6bc4seed2_5.json new file mode 100644 index 0000000000000000000000000000000000000000..4638e118936a3f27d118376b438a3a42a6afeb30 --- /dev/null +++ b/4b284b6bc4seed2/evaluation/rankeval/4b284b6bc4seed2_5.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.35, + "acc_stderr": 0.015090650341444233 + }, + "anli_r2": { + "acc": 0.326, + "acc_stderr": 0.01483050720454105 + }, + "anli_r3": { + "acc": 0.3408333333333333, + "acc_stderr": 0.013688600793296939 + }, + "cb": { + "acc": 0.4642857142857143, + "acc_stderr": 0.0672477765493766, + "f1": 0.23666371942234013 + }, + "copa": { + "acc": 0.76, + "acc_stderr": 0.042923469599092816 + }, + "hellaswag": { + "acc": 0.46086436964748057, + "acc_stderr": 0.004974473255391268, + "acc_norm": 0.6085441147181836, + "acc_norm_stderr": 0.004870785036708273 + }, + "rte": { + "acc": 0.49097472924187724, + "acc_stderr": 0.030091559826331334 + }, + "winogrande": { + "acc": 0.5666929755327546, + "acc_stderr": 0.013926915052757347 + }, + "storycloze_2016": { + "acc": 0.7188669160876536, + "acc_stderr": 0.010395836091628122 + }, + "boolq": { + "acc": 0.6085626911314985, + "acc_stderr": 0.008536430524403955 + }, + "arc_easy": { + "acc": 0.5854377104377104, + "acc_stderr": 0.010108889212447777, + "acc_norm": 0.5660774410774411, + "acc_norm_stderr": 0.010169795770462101 + }, + "arc_challenge": { + "acc": 0.2832764505119454, + "acc_stderr": 0.013167478735134576, + "acc_norm": 0.29948805460750855, + "acc_norm_stderr": 0.013385021637313569 + }, + "sciq": { + "acc": 0.878, + "acc_stderr": 0.010354864712936705, + "acc_norm": 0.871, + "acc_norm_stderr": 0.01060525678479658 + }, + "piqa": { + "acc": 0.7377584330794341, + "acc_stderr": 0.01026250256517245, + "acc_norm": 0.750272034820457, + "acc_norm_stderr": 0.010099232969867476 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2756c15cac8ef15074ef2a4af5652eb5e06274b1 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1728bbe9d573179649c97e76dc0425ed2b915b13793b24961e976deff33a3909 +size 199058647 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_0_mp_rank_01_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_0_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c4f946143a7af88061188ced9c4946227d0a036c --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_0_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:61ae195149e9b7696b01f7123478868f9676ac6dc2c8f74e42804b8fb43617e1 +size 199058647 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ef49bf8b5ed011454f9f8102bffa3b74b689f422 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b85aad30d50e8ee77ee5bea4c7b5f3b8d1bd11451684d1961055c6eb3f950b8a +size 199058733 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_100_mp_rank_01_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_100_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..24fc1ab0776958ec159f8f2921a48a344b0672e8 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_100_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2db4bc1c0d1af8209027abe6eee35b324fd97dd3ded5aaba697af1be7f891afe +size 199058733 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1f3282082528ed7662e3162de434136ebf4b934f --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:496d381b1630117a4f337ad2b87a7c91aa445940bbf25beda102865d47c93d59 +size 199058797 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_101_mp_rank_01_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_101_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3c466851f083d2826524295f59a76849d7d1d3a9 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_101_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8dae156422d8b8e383f1b46e930c55f310fe748a77fc73be98ca6dccd2bb62c1 +size 199058797 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..30f031b098f2ea698e1ce246d69fc94a396f0510 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:34fa300b2ed7e266cb1226086db9da14a007e898b021585cc17c4447c6fbd09e +size 199058733 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_102_mp_rank_01_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_102_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5df11c2ad71e50e427c8d27622d3f394c95b024f --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_102_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b6e68200b42b7127accf41d9f4a39ff083526ff7f7d30fcf62550351ae32e1e0 +size 199058733 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..810505b0d2564ae5b161ef0183d02f480a28704e --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:218fde624822c2c74b5c38aa58eb23adf1e191dc18a9f79a9fbf2ddd7a8fec59 +size 199058733 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_103_mp_rank_01_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_103_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6af8b45f14b9e89a25a37874ecef3e40fe5bdc39 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_103_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0c768bbdb3941b28ced1a7c7c1ee1db30520814781f108f28867a982ae044d0f +size 199058733 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2e9ac062838f60ad787d860b99e050f733cccab5 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e88e24d6fc28b2af58c9b40d6f953aacdd0eca125510830051588e54e95eb66 +size 199058797 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_104_mp_rank_01_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_104_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..98e6d9e77a7895a08dcee4ae1974412104e4da8e --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_104_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d99c3b816d2cb15dbb27282f6d418bc4206c59fdb5cd19a84506556fa42f6cf3 +size 199058797 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..16bfdb742eaeada769b89f40f78b7fd56b8501d8 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fee95f995988c1b84ee270eac54d602971b1e184391b8845986039afb4da3b5c +size 199058733 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_105_mp_rank_01_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_105_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0fd3bd8b7279f05ef7614fbdbce90f73ccbb0869 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_105_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0d7b551f240911bde95ee7a0c3084ee7bb608bc602ccabbd2de4daa32a2a93b6 +size 199058733 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fb03de13c02ba8cc420e619832fd7aedeb62791a --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:382ed7d92c6bea73af9699836556ee2e4c7e38daf6b5bcef8ad067cc75a809f1 +size 199058669 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_106_mp_rank_01_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_106_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6f4aa6b58f3936817f897e2360fad416496c564b --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_106_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d8e91a62b651ce637701383ab80a23d2bd47d15f25ef5640c6b5a2506038a7ce +size 199058669 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..75c8718a4d46d79776c6eaf658bad15bc9325617 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2f31e9fb7f08af235e337257d205344bd7c5230ed3eda73a6cab526e75813fcb +size 199058797 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_107_mp_rank_01_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_107_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c204eb926397f80b5bb9cc92e3d3e4bf8c061779 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_107_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c54b32baab3cc759a32f83840f47246aabbca14f4d5c5148a548bf5ec48a403 +size 199058797 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b2771d5e54eba21983024836a4a4b5ab393de3f8 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f189797fce258b71d3fb29d25568c982decd20f2f9874462349b24d3e1ef747a +size 199058733 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_108_mp_rank_01_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_108_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bd35a6242fce4cd796db34ae11e34b0087de23dc --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_108_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c0d8c2dee863a1508276cd15ff3c7395dc155dc7a9c577c2af8de40f70824675 +size 199058733 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..192f96e9f497e2a89b19fbd4b0bd1a7127331a5e --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a8cd2d490c73af202d2e598c3e2b5ccd38dd6a4479370f1192100a1ef9ada864 +size 199058733 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_109_mp_rank_01_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_109_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1dd67261b75773c8cd92a9533c6ca6f12e2c65f7 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_109_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3ce796cf2473ad82dbb0ba043bd2d2a89b7d016eb6981f8962c5730d8ead9239 +size 199058733 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..686c76314f685a39367d022e38374a36a9647180 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3958231d76d9c2a7b01316bc53451e415e27bb3b11fd69c5fb5c03ef106ec586 +size 199058658 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_10_mp_rank_01_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_10_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cb33ebab4ede5db34e064633bc5d9b47a8131589 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_10_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4bf79656112d6080884516ab0a977b2e856d9c2eadf0aa8835473009f79144b2 +size 199058658 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a73f0c6df377604a54ac7b4e3a38a4af0e4459af --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:95f746477625c3ff1ede016aa76356e2e93980f326869cca48f2b70987519bed +size 199058733 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_110_mp_rank_01_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_110_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ce53e40771a7716d9db9b38f45d0793f9daa7ae1 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_110_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0d33e2c9ddd1185ecab521a982aa17de516813e00f91636b69533a184820bc95 +size 199058733 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5cbc49ab9666e4510717e903cee7c4fea26c12d4 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ab183450d8f155d71c6da10ee57c10253a557f8e28baa4178250a6d00e9e4cf2 +size 199058797 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_111_mp_rank_01_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_111_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..91fc9adb5302139a7379b2f0f810f28f33903fba --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_111_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cc001553daf5c670ffd38e4168a58f82cd7734c991effc64de4cb508ef75bb24 +size 199058797 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5aed42675995a6555c7355836fd530a8e1db838f --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0f035efee3ba6f18ec582f8eaf7b888b8feca3b2143b5efb0e8b67768123e64f +size 199058605 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_112_mp_rank_01_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_112_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..db22f96d92788778b74ffe2cf5d85b43a991d1b4 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_112_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c8cfe6d762203fc833710b14620bb0ec6acf97a8746c5c949ac800f36945283c +size 199058605 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1ac06552205790cd93acf05ab1a6f12be2d1c4a1 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b6b4382ba170799a01de7e797b6a9b53a26425d0fa23159d475b84f6ccee5d3 +size 199058669 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_113_mp_rank_01_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_113_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..151ccb8fc798d0391f83fae3bed49e49897b242c --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_113_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d702d536e9f1dd5f1c140e06f1f0d39a83e3c8950b9d117185270fcc16892751 +size 199058669 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..14f9f9b3ef0cdbbc5661c8c09d8a12082053c57d --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:075b792b3bce711ef1d3674e6152ed79b33fe60b4b8bb99fa35ea4f7ad1ec18e +size 199058797 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_114_mp_rank_01_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_114_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f4c222bbddcc2fff7288a8354fe7d85406076e44 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_114_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1fb08ca66fe3ea6aef562398bc11f07e80224cb713794103e8696b638a2953bb +size 199058797 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..18c5f31f56d162cf082d7029112a06999b2b9cee --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:023f43fb2f7676295b74e93c526fe5a7336a7597c3c8182b4065e213da4b2e90 +size 199058733 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_115_mp_rank_01_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_115_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..afc54f78708181604c37e2a038b2a199229a96b4 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_115_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:680db5f7b3defa9514b9b72cd0680f7a8b284a4fb616ec57b85b93401dd39e26 +size 199058733 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..06745b1cb4e2eb2fe7fe4bab3b120b56d8a14ce0 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3dae1d454f026607aac1040a5502f43e6671219fb9e6a3f19f80eed6e0ddc5c8 +size 199058733 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_116_mp_rank_01_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_116_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f3b80879f056e7aad6270d20d575e443055d76d9 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_116_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:46ae06f161e3a12afe7e6ded8f0e9cb602596dfd44fb2cc7925d9dbc4e8337af +size 199058733 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..63edb052a56792b895c410ecf438d087ac96a48c --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:71733877aa13d99545b0b22f5bbf8940df947325aef758ab42193c43e3622c60 +size 199058733 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_117_mp_rank_01_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_117_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5d3a29b3a2e5edc96d3cf3676d7516a8345f408d --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_117_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:050e82b34f8f750e5fb40dbedb29a40585eee92f8140f92a70ad494c54449386 +size 199058733 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..06d2536d75406cf6ee202af8cfa999676859eb33 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4bb7707327c9ce9814fdf37a3b7272c4475b6acf61b956c5bf861ff1801097e3 +size 199058797 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_118_mp_rank_01_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_118_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ec38930ca60f20d09b50bc56e6a39e99027f0955 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_118_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c6318ce82542e94527491d7a27d143bdc505460e47871518172aef59ca51d5b9 +size 199058797 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..63696c766859e0efbf0f90a22916ba0ac58ae68f --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:30b53428c5ffc813b38390acec54038ff0fee3f3817410ae35653c08566e9a60 +size 199058669 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_119_mp_rank_01_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_119_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..832932c3ef4d605ce00560040bc2bd82480c8ded --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_119_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:803f0c1635f781be2239413dd2ecb6e790b565130bd24223f19c462fc6d164c7 +size 199058669 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a846806bc704305b6d8459f8137b8cf058f57a37 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3452dc49dbf5804bfc8532827776f941693c7413db59504234e8def1830f49c3 +size 199058850 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_11_mp_rank_01_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_11_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3a34672372559ba980e939be81a89a486de29820 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_11_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a9e339d8d79e17bc70506d117646a92ee90ffd64c0e8b299db555ac7ec7df8a +size 199058850 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..350f339b26618c508272fd80c6ea58eae90294eb --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:16706bc926d8b50a15ab6c85745cb6e0364f092e4ac8e4f0ea8db2f47871fa80 +size 199058669 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_120_mp_rank_01_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_120_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0fce40b4117ee99077dadd97cd822540b0da90fe --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_120_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9f80cacfce5d28cc1fd13effe383bc2bb0609ca1febc8a7fba91d047bac793aa +size 199058669 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4ef003a3b796563ba828a19ab4be189c658e7e00 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d5a2b2f595d67a85fc4f019f3dd19816065daf7bcf8ee27f56b2dd49ffd3dead +size 199058797 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_121_mp_rank_01_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_121_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e1f92e5af67a38d47059395aa2ceda88da1dcbfc --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_121_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:30edac46d98f7812514d2c49cb5181cee896b62a05aff2bebaffae034d3ca643 +size 199058797 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6a1b3f85c28666e443ae1e9389acf3e99abd6612 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c211419ffe9b552529d8b6fc775d93d19ff19c2c18f41bf5cbbe27ce548b455e +size 199058733 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_122_mp_rank_01_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_122_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..17d1f578e1e2ab5a8d84fd983ede5557b8fe5b64 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_122_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ebbb71a4178c1771c036e1e891b726669cd0f68d80c304b9f8a623a1c2d2d647 +size 199058733 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2b19ceedbda5c3ba56a8306ec393dc53e01bc4e2 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2ae0508334710e64a5046571cf3d135c8250bb18aba09532a7e445d2094c673c +size 199058733 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_123_mp_rank_01_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_123_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b6190085e9e97244d5e3b5272aba87fee2862ab4 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_123_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1c50ada51927fff7be3e83f1b484b3f20d0dd24712d27fe64ac91fc5d57cca50 +size 199058733 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..31f4b289d688b78b41bc3ece3e32d3d303ab525a --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1f390f01c728d8eaa9f60182af9aaa7a0aad290bc19f810f0b77035434f1e119 +size 199058669 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_124_mp_rank_01_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_124_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fd65db4fee2833566c10737c785848d9f6c31b26 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_124_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1d4bfa77101bb1e63b6fb06e44de609fbd80fdb5b1d99188b4f7f1ab05b96d21 +size 199058669 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..16b83ed3b96796405330f2917a7a1ec956dd074e --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:362957ada4eadd59d478ebc68a1c50187cf706f2dfef45a341a1f06f03e4f76c +size 199058925 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_125_mp_rank_01_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_125_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f6d7354f744a2a9d27441646ed2356088cbd849e --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_125_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:29c7c2840fce4333fa1b1362cc0278ce096c556bdb753b95b2fb9310ee9dc3ed +size 199058925 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8a984da814db71a20c2e2be2e506c5c894cc3c7a --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6344bdf66da80dc6d86ae8203c6baee64c749df176879b375bb53e6cf4b83d14 +size 199058605 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_126_mp_rank_01_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_126_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9ae52fd7a5b20c3f81de73bcdf60eb7124f82ef0 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_126_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:404d2919bdc6a012640bc2a5fe62759dcab5d332dfb35fbf8a6e3879e511ea03 +size 199058605 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..20ce6bd7b21582723654f703e791e3ea6b2a50ef --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:189af18d3f49a4dc9011d6b1f78c2072ebece09253afcab4a76b8e9249fa71c8 +size 199058605 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_127_mp_rank_01_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_127_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..018145240179d7854ab588f66e4b49389b8ed5c2 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_127_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0aa3420757ca89e9fb40b1150a87c5daf205477a96ad84104d213c8733644f65 +size 199058605 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..59b1c93113298ddc68941eccfe79f44e8deb7668 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d85c0efa7e15bcdd47ce229454b9e2a062fca1e747f5186b759a8df23a727d06 +size 199058722 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_12_mp_rank_01_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_12_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bfaae244ea67ec0c6694410d2f5d07e1294fb1fa --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_12_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a9a21927185337f351d52917c02d4c1523274cff9e7c1b81f0375a18d1de22eb +size 199058722 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b4a5cd86b001f6618bc02938a2ae8559ef5b7b8a --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b4dfffc89425772e4f9c8fbde0c9e63ce55adadd9ba459cdcb1e4ab600ae3d1c +size 199058658 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_13_mp_rank_01_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_13_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6c95b15f6f5689e88518ed827e4e11bf2d892981 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_13_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8f70bb8d19788a2020dd337af5498a6850aef92dcad72252aabfa7d7684d5c0c +size 199058658 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..705c44e0c80bc589c7c0e3ebc492f9f8558ce07b --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e1f224ae3dab5135afa6168cc3a7bb1acc1f6533f8753aa5806efb12a24fca3 +size 199058722 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_14_mp_rank_01_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_14_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..696c178e725bfb31a74dc3795eac6910035f7f78 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_14_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a0899f2e268fa08cdd29c452a3154c30f8f3b8e0ce94088c9764be76d5a05226 +size 199058722 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3a2abd2b293368da0c566476243eb7619c154b4e --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:219dfe6ee3f191a9e07e7b9b8af49eba28a457bc32619bf64081a32a5f8d2e05 +size 199058658 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_15_mp_rank_01_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_15_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d8ef1fbef18b1d3a2b0eb355bec230d7c3829ca0 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_15_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:59a46172213bfaad30c52cffc506bad411942af5f484ea1072eb3413b964b04d +size 199058658 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f50b1169d3ec86b23e1622b06a30b56857e79a2d --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e798084a0e0ec44821d53a8168124d6b665f18bfd0737896b5d5f13c12a462f0 +size 199058786 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_16_mp_rank_01_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_16_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4ca38f793fb16f2c1eb7f71fa715abbcefe15bf8 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_16_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:843dd3e274f1eac24a8a66e8f43e72a1b89f591c8becb3584f2d3c42bb8244df +size 199058786 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5718c40df65e3de2430c69a72d17e8b982bc3ea4 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cca1310097b86e907f525ff5bde0ed48b513688c3bc967de15841d68210f074e +size 199058658 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_17_mp_rank_01_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_17_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2ef46ea68bf8a7191d78948f1e279910ac275d5a --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_17_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f5b2874ea789e54d5b3906497598d33c23b42cc1fe17e13341c87edd80501f21 +size 199058658 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0ba9c53661f2b6bf1c0d4d89710fd1a0aa3940e4 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cdd1888362cf069c9588a2c0218211be1d6dbde55df19a938b06cfb49c2cff3d +size 199058978 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_18_mp_rank_01_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_18_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5f9e759b8422896cf7b5a9e4c306d66460098442 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_18_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b464be08e7e2c68c2812b23ca09b1653dc9f8f89b1bd6ef68261b0c19124e255 +size 199058978 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f08ccb19b8ec443984bc0cf14579d96214e2b2b5 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:888ac2dd882dcf158690ef12a19d6eee3be1bf9878c3f43e1e53a054057e7d8b +size 199058658 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_19_mp_rank_01_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_19_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..063c9984462058447db95a38626b92d12603f702 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_19_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a19b3ec9d45fd4507a31042ac435623b430e44f14b62a3f1680d1844c73d25d3 +size 199058658 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..20d999132376ff26ca9cd6775e3d571b570ac43b --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bc315db1f96326bdf2b17ea97d6709554b9564776efe47ecb5e43e69a4b5bb37 +size 199058647 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_1_mp_rank_01_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_1_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..34881ac667948de2b46737945600c1d513f44d4f --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_1_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7be184d22d43a5c0025b4f7fd1c69a0adfb08bdeca665bad87dffcafd90a9675 +size 199058647 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6ebef343a99b09ce3fe59ec39b4cf9e23a98a22b --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f8f1b353cf9e91fe23b67821c1768f76162ea050e927dee4545303ba9a9b7cd4 +size 199058658 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_20_mp_rank_01_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_20_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..58d2a994fabbd3d2c34739bc1f2c95c2ef09b283 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_20_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e57655bce21de10c56c32353ec4173651c5ecad9b2f01c5dd9a9a8e3cf4a4cb5 +size 199058658 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c1c16645210d505100e81e2afd5aa640fdf26091 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eda71b9f6e8d8663b4fff85bf4f784d2fd6617775a5e5e50a9e4e2196fbe96b2 +size 199058722 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_21_mp_rank_01_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_21_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7f10e2a2293d273fed187b2be551f4dd86eefcbb --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_21_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4512f00be9f6ca848b8db23f811bda003d4666a38cc970b61fc02721535ea61f +size 199058722 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..96cf8240cd004cfeced70de8e219db7f17185526 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:45e55bf84e15d180836816ac5bf0971e2b80eedc6c0ede12f2c6ae47f173b6e0 +size 199058658 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_22_mp_rank_01_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_22_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e2f2df2589892ffc90c122c824e47527d6a09751 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_22_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5b7b2230a17e9dad222988663291702bc3acb9a782311f871a2020f30d001a3f +size 199058658 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..09e1d2e495854af8579a3131c3852c7045d57560 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cdfb803bcb8fa00b9707ab0ff2c3e119d6cdde39efef1c3c394e2c9ba0384921 +size 199058786 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_23_mp_rank_01_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_23_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9eaca13d71a3f366411d7989567fdc5af77f69f0 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_23_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:673c5ee5073ee6831a2381a31dc1fb9a6e4ef82a0cfd193fae4687cb33b38113 +size 199058786 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1d2c88b36e74b4e98c8ea8659daa6dd4cb57bbe7 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c5bfe71967a3a86c80b864a15ae7e366af04b1bdb11673310275935fda09dbc8 +size 199058722 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_24_mp_rank_01_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_24_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1997dd80c31078f54930305f13ab77bb94e629b7 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_24_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9239d2a0604424eb22bc88fa55d6ef2304ad4d53d48edac38d6acd4cd92ce56d +size 199058722 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..88a91d5cef558783e3b5f00160f11444d9419178 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e0bf5da35dd816f158057eade92b1cb90cc26424d3a461814eddc37671e859c +size 199058850 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_25_mp_rank_01_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_25_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..724b11750731fb847e968b3c2566ad504067f005 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_25_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:71655028821353d94dfb98696a68ec4c32ef4e2df1b47b6792200096728834bb +size 199058850 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..de332459a8a22bd3f05e6a69257624656e746883 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6c9eeb0f55009e5f957bb8aef4dfa48feacedd67f4721342d7c5ced95adee385 +size 199058722 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_26_mp_rank_01_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_26_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b7edd238c118bf358b4bcfb46cc641c102c7521e --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_26_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d566cacaba69b8e44c78fd478e91ac3f4dca80adb2c06d56e8d1a1d07419d92e +size 199058722 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8864c50034ed5f4026beb66859adfee63eee3ea8 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b86aae9449d1db00193bf2336818071895748849f527dc291ab9fe3734b50a7a +size 199058722 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_27_mp_rank_01_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_27_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2da856015ded2055ac0b07163f9328273d82a220 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_27_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:135fda414382f329244568d30874e08e4ccea7d5bd634302c966428a42f5714b +size 199058722 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..975a31a710667c4a5a610bef5c9d05995a4697f8 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fc701f536024b8cc7416fd79e2eb28a440268ae2ecf9003c8db41ea830f47a89 +size 199058594 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_28_mp_rank_01_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_28_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..671b2ae9cba02dfcdb1130dea997653248aadf13 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_28_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:87fb5af6488765429b7316e28ea31068776e6cbfc59d561231bde7fe731e2e2a +size 199058594 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..780b052c24bed0f02efef59337264ef2d30f0124 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c2c8e68bcc75352ea265bb0ff99d315e443f30fdb7bbc6f382757c8680364639 +size 199058786 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_29_mp_rank_01_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_29_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..129bef77cc8af4aa00b3e9192043a51b7a0c89f4 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_29_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f7724b1ee42518c693f7a7eb645a317f4688975ffd5ce2139f6c60dac674c467 +size 199058786 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6c5144c801de87fb360490e6c22b5f3679e52fd5 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:98bfde0b85cca9785a9d88cacecd6eabd1abe63e66f87bfb27590fc50c27029f +size 199058711 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_2_mp_rank_01_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_2_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..10012010a123c573b33c56993d0e3f7ddd15282a --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_2_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0eded4c28ba9287666eb0899320e922fa091ab9c5f8ffca95bf1853e09fb98c2 +size 199058711 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2d55b7481c97975ee251336bc54b86739c0165f5 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f4ed28db7333d0921740b67f70f6a03964720ed3319a688a2fc33484a3dc474d +size 199058722 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_30_mp_rank_01_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_30_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7ebda91814e24aae40e0724bebfeff9f549725b2 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_30_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:400b83509fed822c60cc5716b9f684c84dcf03e9b4db0e405c5f192152056332 +size 199058722 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1068b2bc03d210cbe1675edfddee08317e74dabb --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:896b6eb840f96a607499ff6c2772411f09188af29e5e4b9de04cfa43cdf4ebae +size 199058722 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_31_mp_rank_01_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_31_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3a9e242249fc809a29584e21d3ed66e0a0a40a24 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_31_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d075cde8140fb6ed70d7b4861077c78b6db8aadaaeccb8224eda3bc4d12ee259 +size 199058722 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..758c7a1755cdf9d0f0ab9da84f4b57e1e658a9e2 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4ec7d5bc61b7137e8ed1f9dc3ce0f5f23d4a87a34013df9f9db6630361b441bd +size 199058722 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_32_mp_rank_01_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_32_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7df2ca83c2aeae7d2d995c8d35463b84e71d0346 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_32_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c4d69520cec799896a3acd22bcda114fb810f368ac47bbcdd7a9f602f04c9cce +size 199058722 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c79b7a8a2707622c2f8872624270140c09b0fab3 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:03e9ddebb8ad920ff5763d228fa1aeff3ed4e380fdf07ab4f054f0ba89868c68 +size 199058722 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_33_mp_rank_01_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_33_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1910972e3dc55ba35108488d7954ca1fc5b6154f --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_33_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3c57143365728e060f7929a80204eb919d70c98469ccc9fe194232d93ee908a +size 199058722 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1031addef89df54e5e793b44d8d6ff41a0cb32d3 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6f80670861d8d116f81b108a28a8b75159db6babb30fb8927417334a44ff75b6 +size 199058722 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_34_mp_rank_01_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_34_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9254c666f04a424695ad9e0f1c7b3e8ceda878e2 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_34_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8eaca44f0f701457ee108876f9843738f2d8ee592ac619de4a08a61f2b6df613 +size 199058722 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..14722651a16faf97f8a2ae8fd12a4e7ee4e52c5f --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ffbafaf3b3670c56aa4c19c42116b0cd953f2662db223434fa3fea34db80782c +size 199058594 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_35_mp_rank_01_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_35_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1acf3c7e040dee5cc96632ec3bd7a8d5f5f3641f --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_35_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1d4a39bf36929ae28e861914252c854f8f2b6366356b80330355752bc117d76b +size 199058594 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6d854bdf29dfc2eeb5ca33cc1a128ddafca43e1e --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4dae0b6b0b0b11601da068d1eb833eedfe66d7bf4555fcb8a2d0b6c9e6b4baa5 +size 199058722 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_36_mp_rank_01_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_36_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..65c79310caed9df02719dd4eb2d8b5ec4d88d704 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_36_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4689bab0872ba1866e48341125d2ca4deff96f5f21a85c9caa411eaa4fc4d3ef +size 199058722 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6b94669e615fa8237ad0c2dc9fadd7ffa5180213 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:56e14ca0d47ed85a015ef4ff5fff47da1777e1569961a42458956571ebafb27d +size 199058786 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_37_mp_rank_01_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_37_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..04d12133c84f84238b14203ee8ee0f804bff3015 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_37_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c47dca4e1c0fdd2968d576e7ca8e4f5ca97d3c15f4c619a686f105bf09f7b812 +size 199058786 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d656654b6b35efa9658f22fbe95d32c1475b2ed3 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c49826a579c6e3900a66f222f208fe7858084204dd4cf6738492465a7f91306 +size 199058850 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_38_mp_rank_01_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_38_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6b355483132f7ac1a1b0cb7dd9c73cb9b145ed7c --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_38_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:15c104a7cecf32b2c66844235a3248fd3f0a73163dbe14c91d218a9f0e45be8a +size 199058850 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..994758d404ef3ed2316f52cc2089994362665699 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:562c927f7ad0a85ee9be1d99fd4750f00fa4665db787a57bf00a0b90e93753dc +size 199058658 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_39_mp_rank_01_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_39_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cbb2483ca38a94ceb8695fda655e81ce7805d858 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_39_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8464d8d4053cb350ff7f02fa2b5c4f6e064e64f3738f18f4b4c037b03e84778e +size 199058658 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8b5757d6a3054c0600c28d3476fe0119bf761f00 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f9d9f20ef868615c0435022c89491878aa0b6f4b5e4641e45fe9fbab7d7cfeef +size 199058647 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_3_mp_rank_01_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_3_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4bcd55c637f4d05c6e1bd3abd54ecc118ad49573 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_3_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:327e8843a6b9639668f3121b76f5fcaff84ba72f498e246f328844a1d63374b0 +size 199058647 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2a4185799be9cb9ee110b296ca2fea276828d039 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b9c0efbea7fce04d08a61b7f1ff6c81468b11829e0fada7cd9ba6960aa868945 +size 199058722 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_40_mp_rank_01_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_40_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3244617075a89a247df64c0617242d2fbc7d338f --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_40_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1e81e2f7008124929d510f048f8878bdfcb4886b0e0c89499ae7c437c09ea321 +size 199058722 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dd6770af3f07aee43325240727b0aa18db337423 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6bf9d0073247bbfff6c13c70d328f84b4fb5a2114e0eb13c4697e2454665b5d2 +size 199058658 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_41_mp_rank_01_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_41_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bed2befa324643956677f2e40b08c714d844f41f --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_41_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cdfef537a50648668f42d3bbb059c830fc3c992c614106160ff671fc3724f151 +size 199058658 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e3953302ecbb7043b63979762f7c4d7e9a8b589a --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da8ab521e60712f9df6688444cd35120af6fa9791bce8ba9bfa2034583663554 +size 199058658 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_42_mp_rank_01_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_42_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c2166dff08e95411d94f9bedec8932aeac22772e --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_42_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b4e90f363fdf0df1e211b4bd5fd764f77d7bdc9906a09846c89997353dd8e3a8 +size 199058658 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..51d1d88ec5181cf966500e60c53b512856c2ead8 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:68fea17752fa963b16251ca7ffbef8ae706ec3fe89fe78ef8a101ea78f3edd2d +size 199058722 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_43_mp_rank_01_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_43_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3a43c66f8f2daae628a6df7240b4a1d58f8a3d01 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_43_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:33e3860b9001fd2985324a7cb41605dc43c80665ad5aa3d389533d2746d3c999 +size 199058722 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c5e2ee90f4b9241d9b726a8adbb412dd188febe3 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:37ad7b0372aa2452f3b9a6d1f874ebdb6dba7352cb9c16b27ed222c86268f211 +size 199058850 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_44_mp_rank_01_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_44_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a0888b9388ed0e97d3f0f882350ffb8c9492666f --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_44_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:88aad16dca7058ce7908090756232d8c10c2886f5486df4cae3e419783c584d8 +size 199058850 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e9c5e7b93ed2e0d5c964df7fd9cad76e3882fa3b --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4625f6989749a6e44c96b196a32b47a118b195259c26fcc383749224a2b3d884 +size 199058722 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_45_mp_rank_01_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_45_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f6e5ed9a19d6baa2a1be45a3fa9dbb17d5335563 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_45_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:09ead4d15715b363915e46f529a51b568ce7976c1361ad768e382037bdbb54cf +size 199058722 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e72bbdf53deb900f54772db0536a809b3b5384e2 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:91a9067041e5aed54501060395b0ee8c293c6951fb29e64f5640b4fe0083afca +size 199058658 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_46_mp_rank_01_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_46_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d03a655ce77b750b12141ae736ac76cfaaad410d --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_46_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bafd6cd4bc7ef60fbd57e26f012aa9e2dc880dc9bda8b982baf8203c7de12475 +size 199058658 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7cd5854b0269111dcb5819f3a7e7984aaa1cc2ab --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:61e46a2d4e9f7b7a4aad1010ba3e1fcdb927de9651e3e923119972932845e185 +size 199058722 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_47_mp_rank_01_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_47_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..24737e0e1acb1a5b96832a4691e2d8a14594a6a5 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_47_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:842bab39cc59ca2f3a3935c969cc64f6645bc56fe5345d7abf93a634d72c5c5c +size 199058722 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0ffb4d96605b3bce833e43f4bc6b7d84aae81da7 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9fed1df56472a99b83100b6ed4f027f2ccf9446f266399b0328838846552e39d +size 199058658 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_48_mp_rank_01_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_48_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..138b29a31b92b16425abff384eff0877f1b55e69 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_48_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ac5e80af2ad12fcf17c777b91c1562686fb976a0f2b49776ab24f0c98c8f357 +size 199058658 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..81ce93bd94ccc99c112a1845e8fe16e2f578985c --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d36662b15bf4498c544aab6d4ec73073dde07e968088b478c553694ca7973884 +size 199058658 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_49_mp_rank_01_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_49_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5e5f6bdc092ff8b57c6db14a5df728570ac803d9 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_49_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3b8f190f8b57af513223d6197cc2606d9d55ef9a51a453f12c2b4a251544c611 +size 199058658 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9c2a244df824063cc974a21e17e7f9e393a6a6a2 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:11ad040f332cda253e5de5392391925e8ef04640366d50000f11f4ecdb69b486 +size 199058775 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_4_mp_rank_01_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_4_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3a4dfcfed712f7214540354b0b81dfa24fb4d088 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_4_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e0730d84b7ea469e91978b4e0e79fbdfb191663110e5a00f0ec675ea0e295306 +size 199058775 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..67ec14b68ee7a7cf045791812551685160bb3dc5 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1a80f70e4291decb447f51eb5f16d380b72f4d167c44e0885c3f2c313a3e735e +size 199058722 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_50_mp_rank_01_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_50_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3ed588a6736afcc7435942138df923575792c37a --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_50_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:464aec78407d6c97c0fd0acc6e5ada9479f86fe95e4441db84e80fcaff72a0f8 +size 199058722 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..48cada99fd7c23a8ecb757ed3fee5f7caebe01bd --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:614f8358fdb2606a2705bc58a67bbbae84d71fae6cf6f075883763d746268fd2 +size 199058850 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_51_mp_rank_01_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_51_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f3151800e2aea287b44241486c0c64bf73629f0a --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_51_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:537025d5087e376332a935736a946cf47ceec6abdf37670feade26693f2f4e15 +size 199058850 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..426e44b16d79c53e20710058f6f9a285dbccb82f --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c00eb6999540307b42ecf6e6049d065253cac1558fac5e1865c48a15ba924371 +size 199058722 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_52_mp_rank_01_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_52_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..477ca89dc0e8d417187221d6527b414b40c54927 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_52_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:795bebe67e1feaeef106b0a7ce508641a7dbf2ee5240f5e1b5d129e7ccd36ece +size 199058722 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..796007e3a9fc35333f582cdb0e55655f8a2aebbb --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cc01e2dd66c4cc0dc7c734011b359005bae11c24d4a665c51c509d8fa3dec567 +size 199058722 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_53_mp_rank_01_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_53_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..45b1356f2a679d592085b011e5f33354842646f5 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_53_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:367579aafc370e3250ed990e5c94a78416ede90d5a75dc486e013773bfcb9ab5 +size 199058722 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..783e841c3fe73ae037272cc093f24415cd1a47c2 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:712a4a2b866afa3a61d7040770ac2ab2e39cb7e41eb94dbe66e691e99df4c858 +size 199058722 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_54_mp_rank_01_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_54_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a6c33a6c54c7d83f0a0edb0aef0eeb37587dff59 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_54_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:705a25145d2a758fb703385c27ceb4db138fb01f0a01ce63fdb0449bc6cfd7c9 +size 199058722 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..49a5087cfeb7f227a6271110a728efbf85a2160d --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a547b59c4b229914bdd4c84a1d9d7e2a70662ec06a26e77827390ad8af9a5bd3 +size 199058658 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_55_mp_rank_01_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_55_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c4a90af1749b64369237101f041beece3f0b9c82 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_55_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ed3516398c70cec6ffcb023adc945a1822a07b1a67c245033e3b46da68c7e4ff +size 199058658 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..388150f9b20c93f5217a8af2cc5bd04a3fa340e4 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9ec81748c75dbdaa8dcf8d5ea9db3dd2659f56a770692c0f08782e9e1942f8dc +size 199058722 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_56_mp_rank_01_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_56_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ae3f860b3ecc5ee08a08f9cd3a579fdd96674403 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_56_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6da33bba1409de18b67d36695b2cb178d93ab04c198a4a733f6e61982a39cc5e +size 199058722 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..80a23a48a4f0773c360b95b8145be1fb28d06f0c --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ced075bba941c5dd83b2dcc8aadf17008784113861c2eda84fb8863654e0f7eb +size 199058658 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_57_mp_rank_01_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_57_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..da4f7cd50e703bd8c1f3a00c36b7e8c54a1e1f10 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_57_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cfee3422ee82c1f6bdee1a3e69a02d3c0356cfcfc3b5f23fd39d726f44a4a8f6 +size 199058658 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7151665b3e843f0a51aa3459ad9d63059ee8d2b2 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:364616e0a97320fc44aa653b373f4db901f7406a41df396debd250150c776432 +size 199058914 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_58_mp_rank_01_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_58_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..34cd8a33258e637ea4fcadc506fa2f21969d356c --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_58_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:08423203555e27da58981b40106fb30aedfeb0611133fecd8daa927a5aee9b07 +size 199058914 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c3d59475409154c63d89377b66ac7b93d2164f26 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b8bb6da33d319b656566728a70481d76aaec06c983d7e82a6a3a5481ee3e627b +size 199058658 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_59_mp_rank_01_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_59_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cc756bdf3ea3348e6ca2f1cad26fb4f2044b8518 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_59_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da9a97f8bfd32e615e6edb3dfa8ab4180480ef7ea263014cf56e793822b7ffda +size 199058658 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..13728af40be78b06b3c06b443371b39e0edab327 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6cbf4805f255ea9c913b141f36b5933547e300e0f2aae45455e6432c5ae07123 +size 199058711 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_5_mp_rank_01_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_5_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..30dc5364d4829732d77196992dcb418120b7ebdb --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_5_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f9b659bf0f6b35df0e0738802671fb5737106090e2f01089895075fbe7e7b751 +size 199058711 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cf04ed05282ae36fe233c5656b30e52ef51d688a --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad3a9e4d11259ae04434182d55805b2f41f740a663fe6c91042b0a426968521a +size 199058722 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_60_mp_rank_01_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_60_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c927ccd0d61d823ec9ab4643baab26c477350c0e --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_60_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cc59d01349112953e5488a3018e876ba82b8c7a4b77ec395c66f13fd8172dd3d +size 199058722 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..417286d916387f879d9fc084e102a185d31170ee --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df0084148c7469a024a7b5a6f602b927d86f534877224c5fe15d1f8d277860e0 +size 199058722 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_61_mp_rank_01_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_61_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a8664c81704616426847d9a386a7d5ce07759d4f --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_61_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:357914456c28b616c385c0169dfbd69eb218e64ec2ce8397db3705b3a41d73f4 +size 199058722 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..89eb32d944aecaccf8051f106f6d4ef35b25ad8b --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:94e98c82a7d3f8763abbda1117a92e3794ad50a0519c3f60ab9757dc20df8631 +size 199058722 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_62_mp_rank_01_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_62_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3fd4c763d4ed8e5d533824412c7ee77858a2394a --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_62_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:874d932b8c4694c91fa16dc27aa5d26c3cb923feb35eba450be7cd2b84f42f4d +size 199058722 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e3061aaa1354c47a0b43b0def4e1d4e3cb481967 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:212e6a435d458ae9a57dde6a28c5d7cb03caed3d8a40f2c0c47412b0938934be +size 199058658 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_63_mp_rank_01_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_63_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..256d34189f4652a524cc3fbe6d71c57e54b521ee --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_63_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0f6b92819c9394797e3b60a773b3050aa23d205593e4d547ebf1e160498dc98c +size 199058658 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8df7197aaf1ec9d2db8838fd0a3f536912db25ef --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:22b534e1a39e0106e6e233c0b179f1cc791cb0ec5cf0260ff43c40cc5356a7a0 +size 199058658 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_64_mp_rank_01_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_64_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..71421334b73dd5d5de7ebcd331e422271c3d6026 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_64_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c48a4941906f378934bc85b561f61889243b5f3eb5b25f60a315bdf8b79e956e +size 199058658 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cb6d430ab8f95f836800c2811225c5bf52c131be --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:545504db6ecea114f7e3b483d75353bef49c2055ba8c16847754f7cd07404aef +size 199058850 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_65_mp_rank_01_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_65_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3446c4dc5956fac9f0488731a681b7561f8a21d8 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_65_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2b9b31dd45be3c80b1ad573c033dd51ae7f929d56def1ef83b573dcba746a75a +size 199058850 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..309523fa66a0a65b5f30e79b4f881c74668f6016 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b33c9432a4b58fe8774b5f72a772ab62acb43a8713f05a2064ae1756bd99aac6 +size 199058722 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_66_mp_rank_01_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_66_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..555af9334b1404dc41fcd017bae3f16a9fec99ca --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_66_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:967249324d2b8173718bd83e03cffc53b10c8e948e1206a2d066eef69bc8e9e2 +size 199058722 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8a87b046fbc9e8738e9e19657d9b54ac371a69bb --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:744dc6b9ec5a978d1515018002a91522a0c7e1c26a1f33e5c65dd3bcd6607813 +size 199058786 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_67_mp_rank_01_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_67_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a243e44c7b9364711a5ff91a4825fa087aa73176 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_67_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6d682ee5b6be58e13bf8b58a79fc3db7c98fae90d195f1982a918c5270de6350 +size 199058786 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..66343b331e791d5fbd58997d17b72b96c569d37a --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f2ce62cb0ac55d3f84833c1b98a6792de7abfea5124e877566c6bb01f0160dac +size 199058658 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_68_mp_rank_01_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_68_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..93d2ed6e86ec9d2a69f046097186d6b8acf23c4e --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_68_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:18fc38b3a84d62d1aaa8e9026c69c79829213b937179562e40381cc5552c0e83 +size 199058658 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4f25e6b953b0dc4f6db8d13e64712e38ad580dbe --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e503f5f86ab87b92a0bfccebca731eb16e27660fd28eed2164a4041ed87cfee5 +size 199058722 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_69_mp_rank_01_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_69_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b5d1967fcff092b56156138e3b2ad090c28ffd37 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_69_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:59c487c0f755a92de6d551372feee940b110a1918fe47d87befaa82ce6564b9b +size 199058722 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3c7e4b3226894847aeb5fc285f5309c6a989eadb --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:baf6dcb3e554461b966788f4f373f1f92e053aba2a0519b331e64af67a48daa8 +size 199058647 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_6_mp_rank_01_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_6_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8365f774707b083c2636b9a5adf41ea351b9b7b0 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_6_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d69747f71ce82186b2a6b1b2be84b551cc9d1fd8e2dbad7b6faf8760055d9807 +size 199058647 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..11a67ce6575659581d2963f9c1aa2a846fd6a253 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c986346ff59ba488f3d25adeb584c1118a65631217e9df1dd4ee09a7488c099b +size 199058658 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_70_mp_rank_01_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_70_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..64a6523cf3ef6a3eff1f86a84485e5b0d25e26c9 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_70_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:344c551defca86e8c320caab1c9b2c477c86a7ba61fda454be8f960c5e0eec8c +size 199058658 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..64d49c30e5345e901a058811194809a4c9f66714 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b90bd356d5061fb95c6af7a5243d2689d1d55610b49ca4a3e60e44f9928e3211 +size 199058722 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_71_mp_rank_01_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_71_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0079d83e3d73baf1f7718ac84b3bef92ecf77194 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_71_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4ec06c25da3b9dec30a53d5c65721ee89145b699f4666e11cf26d012c4a11e80 +size 199058722 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..919f010361a1e82be4b37da20906dc011da8deb6 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:90849523c52cb8260a86ef61d1583da53d062f105f7256bad82618d105a294ad +size 199058786 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_72_mp_rank_01_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_72_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..70c3d0ecce3b4f5ec77f04473f2692a04f6839f3 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_72_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a60e7d477fa93af2abdd7e9867ca3da64d9aa67c538d71bb7821aab8cebd971c +size 199058786 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ebeee3142e86eec65955102ac60ca05d0dca17fe --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4c434d9361b20ca8e90a45f810687ba7cbaf94da648d3ea33264ed2651c15edc +size 199058722 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_73_mp_rank_01_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_73_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a89e9336896c402dc64963eacbdce7d92ab1e905 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_73_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:597e24c7d235338511423635a94f8631c73c3561ebe1468230ad9f692f6d0dd2 +size 199058722 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e77b46810462975c8bf0638e1e79ce42e35cc05c --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6443f727c565e2645ad9b038069c12ab654c79aa9e1032b6709c5f4b647bd944 +size 199058786 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_74_mp_rank_01_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_74_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ca03b5303be8417ab0e443b9284ce0833c3a7e29 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_74_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0b6b1ea9496cdc0d5366c6c38fcd731d16a005ee90c819a26f6cbe402ac40011 +size 199058786 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ffacd57a72ecfb9573cb0ff07499f9d86426a798 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8d19ba10e4721eb9313800b3c2d864956b096bfa2943538a154eff03781be819 +size 199058658 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_75_mp_rank_01_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_75_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..22148198ab3c4b715e6cfd03e82b8a105bb71936 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_75_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:50425b5afa30868ff37bdc97e9879bc635fd59c142d363db06a267179d074ba6 +size 199058658 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..946eb15a21fedf4a39119317fcb73895a956eb7d --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3cd6ae1a7f9d6a076ff9a1e697b368fab3044c5d18e8525ee9de22842f85badc +size 199058786 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_76_mp_rank_01_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_76_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f684d49ccba10e09256ab285df76937d98416c6a --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_76_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c52ad9f17bdb3a94f36da366ae53178bdbcafb843edc5760482dfc58840656f3 +size 199058786 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f53dce7802ae36d28688e0bbcb69727b70906154 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7c5230d7937a5f792d0af3fd78c48cf0514467224ff1fe91db5d2e32bfdaf3f5 +size 199058658 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_77_mp_rank_01_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_77_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ec7d103651196b8d027d32d249c72ca5795fd944 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_77_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:05695a05a2b61b0691e433fb9c36dcb019385f5e2754bd9559a8c9e6df84c429 +size 199058658 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..685579f5720713f82b043d025ac847f180d0bc63 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c64e622189da53baa9a518e5b7e6920c1df4143ba24820d620f59419f6b55fc2 +size 199058786 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_78_mp_rank_01_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_78_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4c15b7b8737f14727162907a86009ba3cf3f5ff5 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_78_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:03b8b388ed130ebbd0ad5a414cd37bbf2dffeb815e9b8ee767f53f5f5613ebf6 +size 199058786 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..61ee3dd027d50c8f6839c55e9a8f68291a60c9f9 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5eb241cc08e163dc1bfe322faf04f886e514e0a929df63511a81bbebf0ded2c2 +size 199058786 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_79_mp_rank_01_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_79_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6595fac825ef06970e868aca469cf0ff147e95bb --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_79_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d7347d25b44ebddbc97b214b52a155b94e69b95cdd1f01bc513a73b13bd11d0d +size 199058786 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..073ea93fd351e6dc9f6c02fc5d11d3968b5fd355 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6d2b29b5cc582ea29ddaa8b14cb591769ac8776c64781cefe2ee679aaee88a80 +size 199058647 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_7_mp_rank_01_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_7_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b16f4323cdde9614890ed97ce052e35988c318cc --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_7_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aec83a3078feb9e6e7407f304131e8bc64c7432b66585d040097fbc71d0a8d95 +size 199058647 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a79d51a6b17e69be054dccf6e86d06620500db2a --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9fa5b21ae2fac0be2a3637e547d6596070f375536491e2290181119821389c01 +size 199058722 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_80_mp_rank_01_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_80_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..56ecb33ffdb8bf76c3774f1fee9656d9b31553fc --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_80_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2a5f66f70d8d49b042e6ada923b193ac4c682f41e9b641e85c67f4b65b326477 +size 199058722 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a0d9f98d30071604c5862a2ab28dfaf38f2a5fa4 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e52d984321a49a1872ca6dc3ae72f12932ba4f804ff43812566245040b5ae5cd +size 199058722 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_81_mp_rank_01_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_81_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e5cfc708f7032880043b252a3064f5f625a8b76 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_81_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a87ae200d25f513fd073288eb100e36b8c09188dad8e7d30a4297f8240e3daa +size 199058722 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ce00cef7b33961fe18beab56f230877e994dae2e --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:809d263e279d4c712c922f5d9ea432f292aa668a19b47d2f6eda9f6d575860b0 +size 199058658 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_82_mp_rank_01_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_82_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cb028813d7c7b55495091b261126725744a87d34 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_82_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:255047277f17917b37be4e1ab110a8ba2c2b4762175076212e2260693afa4d2f +size 199058658 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c800e6641b591f5a08799a20a472de7ad8699326 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a60efa4c1811c5a3fb6e89dbd7516f0a3f670b5d6003e832afb943535f7a61c6 +size 199058786 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_83_mp_rank_01_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_83_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c6b2d491fc2b55a866a273bbe03721eb771351c7 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_83_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:377cbf108a6427ea41d9ba6f9ab5a1d45c388243321d9dc0d14bf5525d71fafa +size 199058786 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e22334eea7e8103f960e9d5b63822f8bcc1fc5ab --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c9fa237d8cccd4ca78f5bf14f817c3e88e92a06d8dce91d5548b5a034b4cd306 +size 199058658 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_84_mp_rank_01_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_84_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b3a40be502eb0cc0e73d9a2edab81f7075ce0292 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_84_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cbf0506d295b3c5523ccd9f8561e5e00f0850d00213e4811554b17cc931343a7 +size 199058658 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..db4d451e94cb846b14fda50bbcea2f213fcf47ef --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5bf6c63847dacbefd7bd92e99d90e2e7a50e5ebaccfecca3cdafa871aa145cc7 +size 199058786 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_85_mp_rank_01_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_85_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9981c4370a6c6dadd3a231555862bbf5483414b1 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_85_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97b0fb22cb02990fd4d755edec33f12a112089f3c027eaf4496257231162b7c2 +size 199058786 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9970c6139c7511e9da44650a9239be681eaaebad --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6101c30a37e4295ec02cc1c0da94c6f3b3a583c2b92a8d3de2a25f9e5463eb47 +size 199058786 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_86_mp_rank_01_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_86_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c68a3f25e97a5f93a6232ae28a4024ddea39801c --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_86_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:28f5de4226ad6cb217ad757506086d3e1c8443b372a4c276aa039f501bb24824 +size 199058786 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d59579487c601b69983095b9ca037a6e8f2a3817 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5b816fd888624919d4dd269e69a15dfda9417d5ac0407ede9ad0ed15148e07e5 +size 199058722 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_87_mp_rank_01_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_87_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..057d872ceb032e48105ac95a8fee0182564c9f66 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_87_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d488dea8615ef1d34da1ef43bb1fcebb085c80dfd2dfaa8ebd7fe8db206e15df +size 199058722 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fdf04ca705d089200412d4e5b7871c05234fe7a3 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2808a9d62d600a8e0b67a90139210aad32b9850f781ddf064791bb7b074706c9 +size 199058658 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_88_mp_rank_01_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_88_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9ce9a1520c437adafe10e88ca813857e846fcd48 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_88_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9fbff5d390cd729938c012c89e68a8a5b2e83c35b9c23da238e4c4f0dee3239b +size 199058658 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b4549a8ec42ea9281db87e0238fea01a00c6a883 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7132300835e81c219e3a04f30ba1defc7caecd1e7fbdbeea53ef29c9bf464271 +size 199058658 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_89_mp_rank_01_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_89_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..52f87d82e28d1fb1b69502dbc7c2fd5af73fe446 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_89_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eb7064b90c419fe8ac041e992a8c9d1cd759f4d60cec8c8f8100f27029bc467c +size 199058658 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8dce042b5b222bb41da3707571ec3d6e9f648b1e --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:632f49befe48f587483f1491fbf2cbe1d4a7654331f1c27515ec54b4dd37a73b +size 199058647 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_8_mp_rank_01_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_8_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dff87d91aac3ba798f5787022923b20c375017cc --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_8_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5cee1c1dcef25c3ea2eced9429e0ddc4bdbd90294e597000e637e04504deaca3 +size 199058647 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..aa767f19aefbf3acd84c9a0e4d0ca7ac72e32163 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eda0db9e43f9d90d6249debd4ab63c5377ef03be1807260e01c3c48254a19f25 +size 199058850 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_90_mp_rank_01_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_90_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f0e7efd49ed97d73d3c0895ef590cd2c59f5b669 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_90_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f23e5147627e6bb7c91811b7beb59ec47845a84ad5b06192d28a5660bb19fa56 +size 199058850 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..90598806bb5e0e05aee8b50f0118d0f0664bd8a6 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5643f2ee50f83fabd2fdc70e432e07a12d5c2ae6cb9242e5e54eb0c04eb85a26 +size 199058722 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_91_mp_rank_01_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_91_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bd68db4f525d39443fec15e02a9dc8e1f04c6f8f --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_91_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ce74ad5c9683e3397d012094182f1d7b94071584249abdf151f4ee7e63afc3fd +size 199058722 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9762756dbcfc577418656993df09d040441c50ac --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a1d9dbf2c3c5d75ec041bd6d1ecd9bea32feb93ddd3edb28e404fd961352208a +size 199058658 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_92_mp_rank_01_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_92_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8d6dc9dedcf17ea66e944074f95b41c3537653b7 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_92_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:947d4797f9acbc59d570553d6a6b68d05fcb4bb3b2a5d5738cd2a4a4bb55b9b5 +size 199058658 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5318c3664d6932160a2ceb2136be6a649736d770 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8daaf0580be5ed99b502bc5fab7ca026b90b41fbb7956021f5a721a78954923b +size 199058786 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_93_mp_rank_01_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_93_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6efb0c72f4a7872e22aa84b878426705b1046390 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_93_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b9c838641db71b69523e16f72765606d2d454fad566afc938fa995cecc050215 +size 199058786 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..621df3dde77cf3acb8e88521ce53f78a15a62b20 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2251db1b4613901101426a209c6c0a3917be10e559ac5d1b25f5bc4d60a0bffe +size 199058722 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_94_mp_rank_01_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_94_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f0b3652ca2bf316fbb4e01e1c0442c3922e9d04c --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_94_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:496b5119056327ae16a75bde908ae76e7d4df467700d983d41eddf248859af96 +size 199058722 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..48ff09fd00994d51ec5c02c2a5167ecbc3a441a7 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ef3a95b13a3ea135430b97a42a31e32a01ee7069bdffd06aab6ade81891a1b5e +size 199058722 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_95_mp_rank_01_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_95_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b77d1c9a767fec29b1714d9195d3a560987a1e2d --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_95_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a55670e52b011dd74bf6084c74cc3dea78457607f754e20c4923f08675fca239 +size 199058722 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f90531872b9eeed22014e49df2b1c1c331597a6e --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5cbecc94804fbf26ba8c0b63b3462e0acd73a0df96c27c5f37c3ff361700227e +size 199058722 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_96_mp_rank_01_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_96_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b412b0433074079b661db476e93deebab4a41eef --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_96_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9e75b46841875092b5783da775f8f2dd7de51499d48c09a150003be9463b0c8d +size 199058722 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e8235b775e879c5cdc6355c847200dd4f13b0a4d --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:858cce19638ec883085c5ca698f4b3934ae9a4d0a1768f5b2d6d18e956dfa400 +size 199058786 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_97_mp_rank_01_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_97_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e7f7803874997553e106f427ad757918df45cd16 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_97_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad3d946a61abfd622d42f573a4686c6cc0b8374ade65e18300c2e70700128589 +size 199058786 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c19778be12edd03375fc560e6499d7472d3274cf --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:184cf40cbc3483e4477c33e1169d9f61867eb381c1d660d2622544eff232a846 +size 199058658 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_98_mp_rank_01_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_98_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e723aa73519fc145b7680cacbc4da0f0ba1ff997 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_98_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d46ad4bb30c9c9a518ea21b0a6365d651d93ba318df27d2117e57bb6fa0beed6 +size 199058658 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6a6523461ff42bd87632da7085c8c32a8421d1a6 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c22db3176069ea9d732b35abfa7934ebb1859b7aebea5894048c431b916619f +size 199058658 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_99_mp_rank_01_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_99_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..21c55b927e0f795e176cda23128b480826207fde --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_99_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c1cd9e681663715d7f777dd9e197e8cfb04a23268690c7afb14d06e1ef190fb0 +size 199058658 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ee16bb2e9c636c643d9213c358cbe87bd13f20bc --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:78d53f8427d860adb49029ac9b90e86fc465239119130df2afdc018d37e3a7ee +size 199058839 diff --git a/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_9_mp_rank_01_optim_states.pt b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_9_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..db475849585c78b1a68138772eed4dde3b0644b1 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/bf16_zero_pp_rank_9_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:728fceffc51c8c7dadf0ca17fc8e9b14117da75ad7b516f4bada25a24ec88c58 +size 199058839 diff --git a/4b284b6bc4seed2/global_step80108/layer_01-model_00-model_states.pt b/4b284b6bc4seed2/global_step80108/layer_01-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f4031a7ae56bba83c514d672037ba6ada8edd970 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/layer_01-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:536cbc99a0a35dfa2a99094f5a45d0fa87ce11171c483bd27861768b443f2a82 +size 167511299 diff --git a/4b284b6bc4seed2/global_step80108/layer_01-model_01-model_states.pt b/4b284b6bc4seed2/global_step80108/layer_01-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ef9db40032f24a69702747a8f897691f2505bc46 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/layer_01-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:acb0b48bbc8d1ae212b12a75f256db196fc3c2ffc30b60cef82a4b9e1db76747 +size 167511299 diff --git a/4b284b6bc4seed2/global_step80108/layer_03-model_00-model_states.pt b/4b284b6bc4seed2/global_step80108/layer_03-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6e784d7a117f27219b177049ceb2411c58b23586 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/layer_03-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:11e9b0cdd1d131d9d711c012386a76ff2cb405801f5de8420a2d28d389f5dff8 +size 113308931 diff --git a/4b284b6bc4seed2/global_step80108/layer_03-model_01-model_states.pt b/4b284b6bc4seed2/global_step80108/layer_03-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a61cb5b2134533db8dd82db8946d90203b6b9b8d --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/layer_03-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fff62c8cf39440ac492d8ea8e412250c4d3bb5c68b3f8452bc1ef892737a3857 +size 113308931 diff --git a/4b284b6bc4seed2/global_step80108/layer_04-model_00-model_states.pt b/4b284b6bc4seed2/global_step80108/layer_04-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..deacf359ec8b98cf0a7c08f4b3c358f307628e68 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/layer_04-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:74006e1580b27bedfcba01883989be10a947855c12177b187a59a9e28e45ffec +size 113308931 diff --git a/4b284b6bc4seed2/global_step80108/layer_04-model_01-model_states.pt b/4b284b6bc4seed2/global_step80108/layer_04-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e2c260981ac22ba6f139fe829c24322723d4fb55 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/layer_04-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2746cccb2d329f0ee38732917193f0d7972a095fa8a1a450820cedf308c64655 +size 113308931 diff --git a/4b284b6bc4seed2/global_step80108/layer_05-model_00-model_states.pt b/4b284b6bc4seed2/global_step80108/layer_05-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..466f8362830f9d65bf0f2805b3bee0ef6698f7c0 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/layer_05-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7213911d5da3c88e2c51334ffeb6c6090b6cb266e916e5ec5f6a8249f51ea0aa +size 113308931 diff --git a/4b284b6bc4seed2/global_step80108/layer_05-model_01-model_states.pt b/4b284b6bc4seed2/global_step80108/layer_05-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..85cfa6a156c33bbc30c63cd767018e9aad1297d8 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/layer_05-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3669d0f94a70b9d07fea3ea2cc2bd3f01a5e0fc6fd4a8dbdca53b927a7191393 +size 113308931 diff --git a/4b284b6bc4seed2/global_step80108/layer_06-model_00-model_states.pt b/4b284b6bc4seed2/global_step80108/layer_06-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ebe51555ca3d70dc6ab1248c099694c36a795145 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/layer_06-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:93a825956d008558ccac28fb5af01da751f6f666ec4bc8fb8040b8e7c2ee14b0 +size 113308931 diff --git a/4b284b6bc4seed2/global_step80108/layer_06-model_01-model_states.pt b/4b284b6bc4seed2/global_step80108/layer_06-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5924f41a2fa011659307e74b0ef10baf4ca51ef4 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/layer_06-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bb128cce27e6d08f34383dedb3b66ab53f56768e940610ab80396af8abc28444 +size 113308931 diff --git a/4b284b6bc4seed2/global_step80108/layer_07-model_00-model_states.pt b/4b284b6bc4seed2/global_step80108/layer_07-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..709fe940b0af2b957f56a2d8073d604ba277d566 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/layer_07-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:08f87095de76818874d6056ed54f33d1e89cbacebcf1be00de79f076a9a16c5f +size 113308931 diff --git a/4b284b6bc4seed2/global_step80108/layer_07-model_01-model_states.pt b/4b284b6bc4seed2/global_step80108/layer_07-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f49bc42538db6c97f273f683b56e9ef6d2ffb1d3 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/layer_07-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2624e511a05915664fcacf24ba0b5c6c3a58a7d19404a7c88d4fa454dadef0bf +size 113308931 diff --git a/4b284b6bc4seed2/global_step80108/layer_08-model_00-model_states.pt b/4b284b6bc4seed2/global_step80108/layer_08-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2604af960b52253994145724a554f9711e5a0637 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/layer_08-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6c453609ec6a03cb78e451a11be000a6da99bcb9adc36e1653040f13824c1c50 +size 113308931 diff --git a/4b284b6bc4seed2/global_step80108/layer_08-model_01-model_states.pt b/4b284b6bc4seed2/global_step80108/layer_08-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a2f0b4581ca14fa4e790f0941ae01e2c05857113 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/layer_08-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c8eb67af554e81562d6567a39fc4f42903875735cab1221a5dd5e1d4c281cacf +size 113308931 diff --git a/4b284b6bc4seed2/global_step80108/layer_09-model_00-model_states.pt b/4b284b6bc4seed2/global_step80108/layer_09-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e9df57a99452840c866d6fe0240b08deef30b078 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/layer_09-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8eea69e937e39399defa5fa2c5b0809889dc65baaa5277867c3c9f46facc2aff +size 113308931 diff --git a/4b284b6bc4seed2/global_step80108/layer_09-model_01-model_states.pt b/4b284b6bc4seed2/global_step80108/layer_09-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7e1685cd53bebe53341e9e09aff493d53deeaa01 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/layer_09-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bef075d62a5e98104d1f917ec9a1823a96abb8bb2cf18351cf060094fb46d524 +size 113308931 diff --git a/4b284b6bc4seed2/global_step80108/layer_10-model_00-model_states.pt b/4b284b6bc4seed2/global_step80108/layer_10-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5c9234cde122b107ab79009d984821910d24ac60 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/layer_10-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1957fe049c3fca28859ff1c5b8ba8df90c4284568059763081e7054468b06c60 +size 113308931 diff --git a/4b284b6bc4seed2/global_step80108/layer_10-model_01-model_states.pt b/4b284b6bc4seed2/global_step80108/layer_10-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f7fe313b4bd64dc370f0d850d4f5248c268adaf8 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/layer_10-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:624e1c216aa2a6c92c7ddffa71a629bdc7110e988890f45b20a1bf8a6a80e1ec +size 113308931 diff --git a/4b284b6bc4seed2/global_step80108/layer_11-model_00-model_states.pt b/4b284b6bc4seed2/global_step80108/layer_11-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..71467f221646cbf32c4f1e15a06f4048bdd8236d --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/layer_11-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3d66fa2f86a45729631002b53f9192fa55f7b3b86ae7cf072df61171bbc7cbc3 +size 113308931 diff --git a/4b284b6bc4seed2/global_step80108/layer_11-model_01-model_states.pt b/4b284b6bc4seed2/global_step80108/layer_11-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3b0bc7a2b02edc77ac1fcf28fb8153a9424e52ae --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/layer_11-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9dac71e3e760ca072a6cadf2bd3ca4bfb3bba8b762a10d5e5d77f3e399ab2708 +size 113308931 diff --git a/4b284b6bc4seed2/global_step80108/layer_12-model_00-model_states.pt b/4b284b6bc4seed2/global_step80108/layer_12-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..03a2dd4de94a6dcd9c3e36a0ba2b94379d7ae73f --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/layer_12-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ed4f8983564924c7c6ae61f56c479b1b85da9207758510e53719a8990134b0d6 +size 113308931 diff --git a/4b284b6bc4seed2/global_step80108/layer_12-model_01-model_states.pt b/4b284b6bc4seed2/global_step80108/layer_12-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..25cf4cf26bf9fa339e7c16f70189a7aa5fca5259 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/layer_12-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2dec3a3ddfac71125534762f718487e5826149f8fe4c900b4cd12887efdcdf2c +size 113308931 diff --git a/4b284b6bc4seed2/global_step80108/layer_13-model_00-model_states.pt b/4b284b6bc4seed2/global_step80108/layer_13-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a59af3bcc7d8d13e7c0596d4714c05752fec30c2 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/layer_13-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1086b97cd7764e987f6a8ef0fd98949edbac0182209a6c107720fbb05dd8f7f8 +size 113308931 diff --git a/4b284b6bc4seed2/global_step80108/layer_13-model_01-model_states.pt b/4b284b6bc4seed2/global_step80108/layer_13-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6c03d2b01694377475a14f784c020f9d58ebc309 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/layer_13-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:16b73168248f79ef8adae23ca5a1d6f645fab92243d855bf3efcdd19c4423a75 +size 113308931 diff --git a/4b284b6bc4seed2/global_step80108/layer_14-model_00-model_states.pt b/4b284b6bc4seed2/global_step80108/layer_14-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ee0b64622810a3dee7c4326df116002467601daa --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/layer_14-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cc742983962875beb4844f4767fbb7ed5ad9573cd73fa67681b867eaafb63ecf +size 113308931 diff --git a/4b284b6bc4seed2/global_step80108/layer_14-model_01-model_states.pt b/4b284b6bc4seed2/global_step80108/layer_14-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..69091a1e53a0a7feb99d73d51ed9fdb5060192e1 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/layer_14-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:061a2f9bcd61074a10266dc8173a7cddb661429e1cef6f8ee0dd294cd8731cb8 +size 113308931 diff --git a/4b284b6bc4seed2/global_step80108/layer_15-model_00-model_states.pt b/4b284b6bc4seed2/global_step80108/layer_15-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2438f8610a8fd90dff5437b196302e01b3ff8e95 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/layer_15-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:52f6707842aa83e791dd851cc812b8ed9ea087a680c06c65f87406c83e4f0b08 +size 113308931 diff --git a/4b284b6bc4seed2/global_step80108/layer_15-model_01-model_states.pt b/4b284b6bc4seed2/global_step80108/layer_15-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5e1fda00aea7dba573e39b6783912c6e2b37e383 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/layer_15-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5e51a62b6a86d0b9371f102d5e5a3bc22a0af0ebfce3a1d69e35939b9ef21e7b +size 113308931 diff --git a/4b284b6bc4seed2/global_step80108/layer_16-model_00-model_states.pt b/4b284b6bc4seed2/global_step80108/layer_16-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..91a02ad732cc5deb066a7e1155f6df8d40436902 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/layer_16-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c728790152c0cbcb54b64031bb44c651c161851a41e948a015f4e3058aef5a1c +size 113308931 diff --git a/4b284b6bc4seed2/global_step80108/layer_16-model_01-model_states.pt b/4b284b6bc4seed2/global_step80108/layer_16-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a18fe4a3b80d0b13576094d5bdfad6c3255d400f --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/layer_16-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:48f6e22ea9d546b920c060e235446ba0b712b11ac4b0c3aa5c7e3183605c8c85 +size 113308931 diff --git a/4b284b6bc4seed2/global_step80108/layer_17-model_00-model_states.pt b/4b284b6bc4seed2/global_step80108/layer_17-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..77c89e824e3c38bdf3d5048b422cfa6f8e98a7ba --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/layer_17-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d661c20ca65d1061c0a32c50af6a8b05fc29d8ebc7779e51c649d490de52d856 +size 113308931 diff --git a/4b284b6bc4seed2/global_step80108/layer_17-model_01-model_states.pt b/4b284b6bc4seed2/global_step80108/layer_17-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..90e627c888df94d51bad3b5662da33a0b7dadb38 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/layer_17-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6696bac22b96a18f48ef207a7253146d6f7d0ef637bf3a89965ac4f16ddc5f78 +size 113308931 diff --git a/4b284b6bc4seed2/global_step80108/layer_18-model_00-model_states.pt b/4b284b6bc4seed2/global_step80108/layer_18-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..358b7660a120d7169d664f10ac7f30978fe45111 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/layer_18-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5d2c4419977517d0a585a23a2884df7048239adf785785d2ab31c3224aaecd66 +size 113308931 diff --git a/4b284b6bc4seed2/global_step80108/layer_18-model_01-model_states.pt b/4b284b6bc4seed2/global_step80108/layer_18-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c54d3784023f12e2d4d67b21ec4e9db4938848bc --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/layer_18-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2b860ed8c78334960976337dde82cf91d54e39cec987072634467b6e3c033a11 +size 113308931 diff --git a/4b284b6bc4seed2/global_step80108/layer_19-model_00-model_states.pt b/4b284b6bc4seed2/global_step80108/layer_19-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f5a2f1d2e481185012b448fb0c9cf057a4bacdd0 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/layer_19-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:544e059bac436256afe916721be57fd004f772839c825962418c35f75e2aa0ae +size 113308931 diff --git a/4b284b6bc4seed2/global_step80108/layer_19-model_01-model_states.pt b/4b284b6bc4seed2/global_step80108/layer_19-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c50faa6a3a055532f4bd5664c5eb0de8ec39f84e --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/layer_19-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a43c2b97dffe61af5f029f02490385f2b1626418eca28dcaa7d8fdf15e565edf +size 113308931 diff --git a/4b284b6bc4seed2/global_step80108/layer_20-model_00-model_states.pt b/4b284b6bc4seed2/global_step80108/layer_20-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1359245ec3af5ee5f526580c23a34a19b0f5abc3 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/layer_20-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4ae5e7e025c320e27930cf8bc34f6f6d844439ddce5df1c4ee4929b8db0bb4ce +size 113308931 diff --git a/4b284b6bc4seed2/global_step80108/layer_20-model_01-model_states.pt b/4b284b6bc4seed2/global_step80108/layer_20-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9186a87fed33cc27d952963d5b35d47036a36474 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/layer_20-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e2db5e9dd8bfc5fa9bd40b12f7ac20eae4b98420a424f8e08346387c16257619 +size 113308931 diff --git a/4b284b6bc4seed2/global_step80108/layer_21-model_00-model_states.pt b/4b284b6bc4seed2/global_step80108/layer_21-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cf3ec8edc23912f25c0df64962280b7e5e1bef96 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/layer_21-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9b8c172fad76f4da06b6ef3c04e24e42eaa1428199bbf17cfc695ac6ea821a09 +size 113308931 diff --git a/4b284b6bc4seed2/global_step80108/layer_21-model_01-model_states.pt b/4b284b6bc4seed2/global_step80108/layer_21-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ee09fe9b76c8268952772cabcb5b66cb939d5d9b --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/layer_21-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c9a3badade986cda6d9d5179ebd3db440164e8713eeea05b3a96f62144afd839 +size 113308931 diff --git a/4b284b6bc4seed2/global_step80108/layer_22-model_00-model_states.pt b/4b284b6bc4seed2/global_step80108/layer_22-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6661622a00fbb096b40ff9d303a74c37f7ff4360 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/layer_22-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:543a82397b0ea1003f70c4aeee32d0bb7796f5c60be6bb62c3e199c195f7d279 +size 113308931 diff --git a/4b284b6bc4seed2/global_step80108/layer_22-model_01-model_states.pt b/4b284b6bc4seed2/global_step80108/layer_22-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..00f8a5d2b478ccc0a4cb8a82d4551f46dcc9f110 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/layer_22-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e762a0b3d595d7ce792036eb73a7295ccc4e737a2435246dd95c6d1afd25332 +size 113308931 diff --git a/4b284b6bc4seed2/global_step80108/layer_23-model_00-model_states.pt b/4b284b6bc4seed2/global_step80108/layer_23-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4e8e0bc3b0ae8081419802b5c2aed02064b6e48d --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/layer_23-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1f2829f085bbee00a8d429e93912e6fac9235e0af96b20f8d49c068d9bfd4c35 +size 113308931 diff --git a/4b284b6bc4seed2/global_step80108/layer_23-model_01-model_states.pt b/4b284b6bc4seed2/global_step80108/layer_23-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3784278be4bbaa253f019bbfda98910908c59e15 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/layer_23-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c23d3e20f7676330f68500bb905238c6f380e9697fad1ee745cd061f611f4e63 +size 113308931 diff --git a/4b284b6bc4seed2/global_step80108/layer_24-model_00-model_states.pt b/4b284b6bc4seed2/global_step80108/layer_24-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..04bc1b3cc808546034cbf663fd283475c6fad558 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/layer_24-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d33684c3178c7ec99eac446debae11ee315a5f79fab477361f25c05af0c31f50 +size 113308931 diff --git a/4b284b6bc4seed2/global_step80108/layer_24-model_01-model_states.pt b/4b284b6bc4seed2/global_step80108/layer_24-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e8fcb79eefd9eeeeabab0998066c1d89d2f3b06d --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/layer_24-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:506de0c636d474aec1be5e573e88fc83dc1359131ee2c47ab6475590dd012508 +size 113308931 diff --git a/4b284b6bc4seed2/global_step80108/layer_25-model_00-model_states.pt b/4b284b6bc4seed2/global_step80108/layer_25-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6c7e85eba27bb4905aa7fbb3c070b2a4f35e5358 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/layer_25-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca3180fd2fe596d62014706f3e3cc3d963db23b4f5040f3f9b8d46d0a5f24782 +size 113308931 diff --git a/4b284b6bc4seed2/global_step80108/layer_25-model_01-model_states.pt b/4b284b6bc4seed2/global_step80108/layer_25-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a050e2e9af8a984877280d204aa05eb3543a5b74 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/layer_25-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b34a13b4ff9f3db7484f782723ed139577aaaddfa60afd3852e0f75aacc30be7 +size 113308931 diff --git a/4b284b6bc4seed2/global_step80108/layer_26-model_00-model_states.pt b/4b284b6bc4seed2/global_step80108/layer_26-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2758f19daffcb63d8c7c733555b3eba52730b7dd --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/layer_26-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:afdd358dcc1c87d366e23b53af3938adc84219887aabe7949346dfbac82af748 +size 113308931 diff --git a/4b284b6bc4seed2/global_step80108/layer_26-model_01-model_states.pt b/4b284b6bc4seed2/global_step80108/layer_26-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b55d826851d0bf449ec35e9e786b0266fad1803f --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/layer_26-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a05ed6dc63953441be416618c4bb8d4146b0266448093985b7493ba2c794430e +size 113308931 diff --git a/4b284b6bc4seed2/global_step80108/layer_27-model_00-model_states.pt b/4b284b6bc4seed2/global_step80108/layer_27-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2d4aef948c170cb62e41e40cad6483342578b27d --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/layer_27-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d6f2c6595f9f1071cc8abcabbe1c2eefdcf4a9af74fec2f7a78e99891b84c916 +size 113308931 diff --git a/4b284b6bc4seed2/global_step80108/layer_27-model_01-model_states.pt b/4b284b6bc4seed2/global_step80108/layer_27-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..290aab8d1fa8a3fb0cec4af1166c51ca7f14c49b --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/layer_27-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:659ccdee5b88d2605d519cfab95cc9fbb22df48d83c53c1e8e222d988a9f672f +size 113308931 diff --git a/4b284b6bc4seed2/global_step80108/layer_28-model_00-model_states.pt b/4b284b6bc4seed2/global_step80108/layer_28-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b0d1b8c7714f51802ea73b544108f2242a8c1bc3 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/layer_28-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1d32a0206f3c2121dd77671ecf44c9d46b5d098313308f59aa5748059a03c718 +size 113308931 diff --git a/4b284b6bc4seed2/global_step80108/layer_28-model_01-model_states.pt b/4b284b6bc4seed2/global_step80108/layer_28-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d097ff54fbd7402ca66db697b8eb5b5e62a585eb --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/layer_28-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c91c34ea16e51f8ab23d1890ca2b8cabccd9609d24c8b7ec980318a94c37971d +size 113308931 diff --git a/4b284b6bc4seed2/global_step80108/layer_29-model_00-model_states.pt b/4b284b6bc4seed2/global_step80108/layer_29-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..432e1379c8eba2ea60e28ea11a62ecd90e5228b2 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/layer_29-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ab977fc47599eaac1aa0ec0dc9576b9cf2f40c69c324aa1e42d02c4acc8d6839 +size 113308931 diff --git a/4b284b6bc4seed2/global_step80108/layer_29-model_01-model_states.pt b/4b284b6bc4seed2/global_step80108/layer_29-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ae7b7fb1657ec30c16c173bf593650c302daed1e --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/layer_29-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:943712a2b745e168bd57b361343e4597651709fcc0138a75fa37cade3ef96b79 +size 113308931 diff --git a/4b284b6bc4seed2/global_step80108/layer_30-model_00-model_states.pt b/4b284b6bc4seed2/global_step80108/layer_30-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a1f3c3b63a613e313e8582991729ad364c1014a5 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/layer_30-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:598ed531f6a9e5a54773be62e73700eb8e3f8f4cfd5e5646bdd47b15321b27fa +size 113308931 diff --git a/4b284b6bc4seed2/global_step80108/layer_30-model_01-model_states.pt b/4b284b6bc4seed2/global_step80108/layer_30-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4ca4e3c1d324d1337f6b13527f520af6b01fbd35 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/layer_30-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:74f96582ed06da71dec84ff2158b7cf72300edd0943009177d60004cf76c668d +size 113308931 diff --git a/4b284b6bc4seed2/global_step80108/layer_31-model_00-model_states.pt b/4b284b6bc4seed2/global_step80108/layer_31-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..09db8efae4b9ed6e3f2e7d763157e29d57ec46ee --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/layer_31-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f38d9c558479f6ad7e6490e233685c8da17ddbceef9c19ca3cffcb8bbecaf4c5 +size 113308931 diff --git a/4b284b6bc4seed2/global_step80108/layer_31-model_01-model_states.pt b/4b284b6bc4seed2/global_step80108/layer_31-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a220bbfe9f4ee29e46a0183578150132402ef49a --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/layer_31-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:25256b1eb5a659dde14335cdfcde1d144cbc03a690aaa3219b64672fd37594c9 +size 113308931 diff --git a/4b284b6bc4seed2/global_step80108/layer_32-model_00-model_states.pt b/4b284b6bc4seed2/global_step80108/layer_32-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..efc32602c3417723eb80610ac2477d0030491601 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/layer_32-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:91acc06b60eecf7c59ba78d85fb04e0ace71720c08c704a96c387b972a5ef50d +size 113308931 diff --git a/4b284b6bc4seed2/global_step80108/layer_32-model_01-model_states.pt b/4b284b6bc4seed2/global_step80108/layer_32-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3912d2f455efea4b59200de740989a2e77df8454 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/layer_32-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:921a0178300431cc74cae961805a48fcaead9af2b4b3825ba3998a3c186048c6 +size 113308931 diff --git a/4b284b6bc4seed2/global_step80108/layer_33-model_00-model_states.pt b/4b284b6bc4seed2/global_step80108/layer_33-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6ce624bcfce6bf81a8cd7d5ee61770ea1333f1d1 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/layer_33-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:32e0e90d6cc00650e2059fdb07dcc9119df9fe13fa0c5b1e8806c29c22563708 +size 113308931 diff --git a/4b284b6bc4seed2/global_step80108/layer_33-model_01-model_states.pt b/4b284b6bc4seed2/global_step80108/layer_33-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..64ac99df3eda78f6a222fb2062c0b2657e42ada3 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/layer_33-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:189ef59c6e07ff3fbcc9abc777f9c2f4cac9cff61d2dba17be0b9a150e1560f9 +size 113308931 diff --git a/4b284b6bc4seed2/global_step80108/layer_34-model_00-model_states.pt b/4b284b6bc4seed2/global_step80108/layer_34-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a4687573e285b527ecc348a6d4825f46c1308605 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/layer_34-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0e81767ff80473935f830979ec7ab70f0ca574eb6183bf553cc63360a0c2c2a0 +size 113308931 diff --git a/4b284b6bc4seed2/global_step80108/layer_34-model_01-model_states.pt b/4b284b6bc4seed2/global_step80108/layer_34-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..aeec41f14698496f3d2def707d9f2a2dfea457a5 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/layer_34-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e7888dde1538964341f1a75e057230f3a118c9ea4eee1590183c21bea6a079e2 +size 113308931 diff --git a/4b284b6bc4seed2/global_step80108/layer_35-model_00-model_states.pt b/4b284b6bc4seed2/global_step80108/layer_35-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..04cf9ecf0e477316051ce664091a67f52c6759a5 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/layer_35-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7952499852f0f7616868519debd1bd428e9a18a323d38ac9c8cf2a12014867a8 +size 113308931 diff --git a/4b284b6bc4seed2/global_step80108/layer_35-model_01-model_states.pt b/4b284b6bc4seed2/global_step80108/layer_35-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e96af0fef5f94eb22ef506795d1e75768dad59d7 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/layer_35-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7f72b04b9b4ebe825f02268f03fcb93b3452f4c052e43afcce0314ff8b721967 +size 113308931 diff --git a/4b284b6bc4seed2/global_step80108/layer_36-model_00-model_states.pt b/4b284b6bc4seed2/global_step80108/layer_36-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9163699d9508f731a7d28e849f8111e3c94e9769 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/layer_36-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b84d380a9f41bb069411089b9a7659c2cd9368c2a8040c237ad00dcd7d096c00 +size 113308931 diff --git a/4b284b6bc4seed2/global_step80108/layer_36-model_01-model_states.pt b/4b284b6bc4seed2/global_step80108/layer_36-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2619210162d96ae14bec437834e4ee751c2242df --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/layer_36-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:614eeda8b96dfa7f2212ec3b7f65bb02112b5bafbfad173f68b1d692ebd559fb +size 113308931 diff --git a/4b284b6bc4seed2/global_step80108/layer_37-model_00-model_states.pt b/4b284b6bc4seed2/global_step80108/layer_37-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..86faca4c6e379541c58dafb39223987582780f27 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/layer_37-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f4155a5f84cf1e7f42fd934441964180bc9c7deef244b95c372f6f0d1b57ee4c +size 113308931 diff --git a/4b284b6bc4seed2/global_step80108/layer_37-model_01-model_states.pt b/4b284b6bc4seed2/global_step80108/layer_37-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..67e1f94c743fdc04ed6f54df4f384769f4633b91 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/layer_37-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ecce4720565dcf6cfcdf7df49cb8fa8240b89c4cf6f0d92881a524e3846c4da +size 113308931 diff --git a/4b284b6bc4seed2/global_step80108/layer_38-model_00-model_states.pt b/4b284b6bc4seed2/global_step80108/layer_38-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9636a0e660caee86dfa0331ad6f546b1a6444794 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/layer_38-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4ac9fcde444273b31e1c0b88da73664de418089f54d23ddafcf3e38d7e3f4832 +size 113308931 diff --git a/4b284b6bc4seed2/global_step80108/layer_38-model_01-model_states.pt b/4b284b6bc4seed2/global_step80108/layer_38-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..678a184fbe4390bdfbd36173dcc16b8d3b0ec2e3 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/layer_38-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3515246e66f4c167a9d72dae2f6a07cf42fb5edc89218bd8350dd37cd32c40a4 +size 113308931 diff --git a/4b284b6bc4seed2/global_step80108/layer_40-model_00-model_states.pt b/4b284b6bc4seed2/global_step80108/layer_40-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d2e21b7740c7595ad1047d0a760d729cefc3202a --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/layer_40-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:70ba90a7538c7b152899d8032f66136bd54a397e7fa2bcede9ba4a56194a46b5 +size 13507 diff --git a/4b284b6bc4seed2/global_step80108/layer_40-model_01-model_states.pt b/4b284b6bc4seed2/global_step80108/layer_40-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cb143864df2fd9bbeacf256e656a2beeb495d317 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/layer_40-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:29215cb8f6908a4f6bcd092dae35102db8b04270aa0778843729a88f9a3d41b9 +size 13507 diff --git a/4b284b6bc4seed2/global_step80108/mp_rank_00_model_states.pt b/4b284b6bc4seed2/global_step80108/mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7ce0815d2e517531a2bb9ce39edbef195a2cd976 --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2162d0d77e460bc393e8dc4114a40161db164b0ad7becd24df38420962773f08 +size 51443 diff --git a/4b284b6bc4seed2/global_step80108/mp_rank_01_model_states.pt b/4b284b6bc4seed2/global_step80108/mp_rank_01_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ad13320966a8d22ef6e95f7cfeb8b4559e8fb9af --- /dev/null +++ b/4b284b6bc4seed2/global_step80108/mp_rank_01_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3628b084d3fbfb48d00be58495fc93d763470680e6bb672b74943d0d5607a519 +size 51443 diff --git a/4b284b6bc4seed2/transformers/config.json b/4b284b6bc4seed2/transformers/config.json new file mode 100644 index 0000000000000000000000000000000000000000..df814c3a71ee49044410636b5eeb4f43611690ba --- /dev/null +++ b/4b284b6bc4seed2/transformers/config.json @@ -0,0 +1 @@ +{"vocab_size": 50432, "n_positions": 2048, "n_embd": 3072, "n_layer": 36, "n_head": 24, "n_inner": 12288, "activation_function": "gelu", "resid_pdrop": 0.1, "embd_pdrop": 0.1, "attn_pdrop": 0.1, "layer_norm_epsilon": 1e-05, "initializer_range": 0.02, "summary_type": "cls_index", "summary_use_proj": true, "summary_activation": null, "summary_first_dropout": 0.1, "summary_proj_to_labels": true, "scale_attn_weights": true, "use_cache": true, "scale_attn_by_inverse_layer_idx": false, "reorder_and_upcast_attn": false, "bos_token_id": 50256, "eos_token_id": 50256, "return_dict": true, "output_hidden_states": false, "output_attentions": false, "torchscript": false, "torch_dtype": null, "use_bfloat16": false, "tf_legacy_loss": false, "pruned_heads": {}, "tie_word_embeddings": true, "is_encoder_decoder": false, "is_decoder": false, "cross_attention_hidden_size": null, "add_cross_attention": false, "tie_encoder_decoder": false, "max_length": 20, "min_length": 0, "do_sample": false, "early_stopping": false, "num_beams": 1, "num_beam_groups": 1, "diversity_penalty": 0.0, "temperature": 1.0, "top_k": 50, "top_p": 1.0, "typical_p": 1.0, "repetition_penalty": 1.0, "length_penalty": 1.0, "no_repeat_ngram_size": 0, "encoder_no_repeat_ngram_size": 0, "bad_words_ids": null, "num_return_sequences": 1, "chunk_size_feed_forward": 0, "output_scores": false, "return_dict_in_generate": false, "forced_bos_token_id": null, "forced_eos_token_id": null, "remove_invalid_values": false, "exponential_decay_length_penalty": null, "suppress_tokens": null, "begin_suppress_tokens": null, "architectures": ["GPT2LMHeadModel"], "finetuning_task": null, "id2label": {"0": "LABEL_0", "1": "LABEL_1"}, "label2id": {"LABEL_0": 0, "LABEL_1": 1}, "tokenizer_class": null, "prefix": null, "pad_token_id": null, "sep_token_id": null, "decoder_start_token_id": null, "task_specific_params": null, "problem_type": null, "_name_or_path": "", "transformers_version": "4.25.0.dev0", "n_ctx": 1024, "gradient_checkpointing": false, "model_type": "gpt2"} \ No newline at end of file diff --git a/4b284b6bc4seed2/transformers/pytorch_model.bin b/4b284b6bc4seed2/transformers/pytorch_model.bin new file mode 100644 index 0000000000000000000000000000000000000000..10440a900cd9c7e22700899d4fb40acdf8b1486d --- /dev/null +++ b/4b284b6bc4seed2/transformers/pytorch_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:667e84c8357ff72554bab0c857ab44b058bedef33ef740ec9889786c5819b1f2 +size 8781203669 diff --git a/4b284b6bc4seed3/evaluation/generation/agg.4b284b6bc4seed3_GEM-web_nlg_en_PALM_prompt_0.json b/4b284b6bc4seed3/evaluation/generation/agg.4b284b6bc4seed3_GEM-web_nlg_en_PALM_prompt_0.json new file mode 100644 index 0000000000000000000000000000000000000000..0db102ed3130358b2dfa9bbc16a5bdb9d829777d --- /dev/null +++ b/4b284b6bc4seed3/evaluation/generation/agg.4b284b6bc4seed3_GEM-web_nlg_en_PALM_prompt_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.32969762409287173, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.03350207893898449}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.07489491650147996, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.001916354345656983}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.300291813063712, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.00461536297454604}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.10919706809885917, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0021601422959730493}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.03439062652684824, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0011545837032529334}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.14370713443920666, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.003246173363178369}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.05063701387421738, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0013546648556391975}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.07070012219921042, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0017208007855753348}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.2895484949203548, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0044970181242023404}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.10382750267360731, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0019706115754186356}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.07104242339944349, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0017912432501280336}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.2857359841499445, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004341838499174088}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.10361568313155001, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.002010621664327297}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b6bc4seed3/evaluation/generation/agg.4b284b6bc4seed3_GEM-web_nlg_en_PALM_prompt_1.json b/4b284b6bc4seed3/evaluation/generation/agg.4b284b6bc4seed3_GEM-web_nlg_en_PALM_prompt_1.json new file mode 100644 index 0000000000000000000000000000000000000000..eefbb22dec81487a225d291701820be09eb5ebb0 --- /dev/null +++ b/4b284b6bc4seed3/evaluation/generation/agg.4b284b6bc4seed3_GEM-web_nlg_en_PALM_prompt_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.4359939783272789, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.041779670416334125}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.07266279503165236, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0017099935201375816}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.3475964219389317, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.00506748933764113}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.11088292832283875, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0019702183179370605}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.03335287604120367, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.001128095255122388}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.1660344328298045, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0035028476813622595}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.05068936829455799, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0012538981392173827}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.06772928954103168, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0015712765252988345}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.3260811514542075, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004710148749523479}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.10353647374043018, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0017861554904427183}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.06867664726380934, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0016318384908350385}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.32775048198841006, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0046848102542069335}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.1047015599685259, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0018609963369853742}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b6bc4seed3/evaluation/generation/agg.4b284b6bc4seed3_GEM-web_nlg_en_PALM_prompt_2.json b/4b284b6bc4seed3/evaluation/generation/agg.4b284b6bc4seed3_GEM-web_nlg_en_PALM_prompt_2.json new file mode 100644 index 0000000000000000000000000000000000000000..09ab2584478abfd399264d8c0409c4f0d63c1303 --- /dev/null +++ b/4b284b6bc4seed3/evaluation/generation/agg.4b284b6bc4seed3_GEM-web_nlg_en_PALM_prompt_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.5047753641043208, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.03242172296180824}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.07334706790054754, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0013930615456138227}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.3737700063497622, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.005196576717483812}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.1150888371627504, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0018709716201208576}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.032868072571177076, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.000815253916940581}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.17803179222143828, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.003604190340424885}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.051840665529172124, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0011509985318477927}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.06734503744998965, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.001233876908858107}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.3449240970361082, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004694373882052961}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.10581169764988507, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0016601816301532264}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.06919868166026465, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0013042029174787707}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.3526754078681369, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004836506777085055}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.10857869554945465, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0017505188501646559}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b6bc4seed3/evaluation/generation/agg.4b284b6bc4seed3_GEM-web_nlg_en_PALM_prompt_3.json b/4b284b6bc4seed3/evaluation/generation/agg.4b284b6bc4seed3_GEM-web_nlg_en_PALM_prompt_3.json new file mode 100644 index 0000000000000000000000000000000000000000..1b9209f431791bb9b4bbd2067a4c0298c9f02a7b --- /dev/null +++ b/4b284b6bc4seed3/evaluation/generation/agg.4b284b6bc4seed3_GEM-web_nlg_en_PALM_prompt_3.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.6249385322673848, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.023211819786736334}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.07372614912850947, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.001359300603084539}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.3888611122018525, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0053578637277047906}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.11637468420417033, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0018331195406713198}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.033416989091581, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0008041939460804035}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.1903256864921483, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0038053895221829945}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.05316112071013902, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0011465281622819825}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.06697897307455199, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0011891190081388082}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.3547382398864492, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004815238098721177}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.10582598758235875, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0016101686735076229}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.0694765908871884, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0012821064008090915}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.364488357943653, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0048866912766196875}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.10953693694712942, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0017209757445741357}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 3, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b6bc4seed3/evaluation/generation/agg.4b284b6bc4seed3_GEM-web_nlg_en_PALM_prompt_4.json b/4b284b6bc4seed3/evaluation/generation/agg.4b284b6bc4seed3_GEM-web_nlg_en_PALM_prompt_4.json new file mode 100644 index 0000000000000000000000000000000000000000..ad111914999194569665a9433d55cbe8d0482e86 --- /dev/null +++ b/4b284b6bc4seed3/evaluation/generation/agg.4b284b6bc4seed3_GEM-web_nlg_en_PALM_prompt_4.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.6172877259530323, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.0352446996928639}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.0748843501395415, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.001381267162660691}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.39598227128772256, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.00522226055907367}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.1180321735790567, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0018211841415573945}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.033363716686448004, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0008232905700585103}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.18904409931911847, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0036763179024498203}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.05290384691957595, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0011327428150165345}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.06681400109757821, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0012097158147883198}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.3551645214739529, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004603707682826054}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.1053542922815303, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0015788673153327966}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.07014407223382836, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0013067256802706008}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.3699177055550494, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0047899231539846945}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.11042261394743104, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.001708240502656495}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 4, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b6bc4seed3/evaluation/generation/agg.4b284b6bc4seed3_GEM-web_nlg_en_PALM_prompt_5.json b/4b284b6bc4seed3/evaluation/generation/agg.4b284b6bc4seed3_GEM-web_nlg_en_PALM_prompt_5.json new file mode 100644 index 0000000000000000000000000000000000000000..6f971b60a9c6b8e25b732548b0a21f29a0cc3b8a --- /dev/null +++ b/4b284b6bc4seed3/evaluation/generation/agg.4b284b6bc4seed3_GEM-web_nlg_en_PALM_prompt_5.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.6739230942233659, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.03781903865026685}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.07434118591062619, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0013606852466120714}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.40517103911737706, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.005207962506245739}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.11775202851872192, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0017322424295727937}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.03309571045270455, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.000762355738688032}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.1960621498928731, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0037598520682319884}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.053092972525274194, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0010965950400499984}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.06663527060233249, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.001226540610105808}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.3640849747385268, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004640046414372116}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.10543601362203549, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0015178302726180323}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.06962894335162277, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.001291561351449583}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.3794277979681509, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004818380083375467}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.11016000573694927, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0016169723040308337}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 5, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b6bc4seed3/evaluation/generation/agg.4b284b6bc4seed3_GEM-wiki_lingua_en_tldr_en_0.json b/4b284b6bc4seed3/evaluation/generation/agg.4b284b6bc4seed3_GEM-wiki_lingua_en_tldr_en_0.json new file mode 100644 index 0000000000000000000000000000000000000000..053b390281050ec4ce3947543e91d857caaa2fed --- /dev/null +++ b/4b284b6bc4seed3/evaluation/generation/agg.4b284b6bc4seed3_GEM-wiki_lingua_en_tldr_en_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.15541888954389302, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0018896399566670286}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.2609485104955259, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.002636869555478932}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.18074785424679843, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0018330825958722083}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.031340296740352346, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0007364805410626298}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.05475940923731912, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0013900561092136223}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.0367425698800636, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0008312312379815959}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.11824683156742628, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0012988846637495886}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.20619299633996296, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.00212551360652741}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.13925315500169771, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0012900858881895007}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.14243870027384645, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0017153432680596468}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.24072866043059984, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0024483585527040877}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.1659756245930406, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0016665877399642023}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 1.5656365853870153, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.06994438419251063}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b6bc4seed3/evaluation/generation/agg.4b284b6bc4seed3_GEM-wiki_lingua_en_tldr_en_1.json b/4b284b6bc4seed3/evaluation/generation/agg.4b284b6bc4seed3_GEM-wiki_lingua_en_tldr_en_1.json new file mode 100644 index 0000000000000000000000000000000000000000..36f6e22a2e559d2e485c47d213be7c3a8823cb75 --- /dev/null +++ b/4b284b6bc4seed3/evaluation/generation/agg.4b284b6bc4seed3_GEM-wiki_lingua_en_tldr_en_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.16880681390038538, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0019611277767498836}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.28525722098489775, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.002677390028605212}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.19671251716356983, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.001845617511049733}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.03604438137203516, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.000869171473451728}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.06302505515896178, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.001516286602693054}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.041911863785581135, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0008870741133490255}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.11944422928337016, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.001289252852685886}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.20967875473639086, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002077526143241249}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.14075220661179533, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.001215604718401757}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.15784656842847097, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0018258770460077972}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.26803761801382864, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.002534338768264281}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.18414503390476486, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0017143415167847412}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 1.973383093888403, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.062022250654948985}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b6bc4seed3/evaluation/generation/agg.4b284b6bc4seed3_GEM-wiki_lingua_en_tldr_en_2.json b/4b284b6bc4seed3/evaluation/generation/agg.4b284b6bc4seed3_GEM-wiki_lingua_en_tldr_en_2.json new file mode 100644 index 0000000000000000000000000000000000000000..3192211738663dab73174f10183697737d866ce8 --- /dev/null +++ b/4b284b6bc4seed3/evaluation/generation/agg.4b284b6bc4seed3_GEM-wiki_lingua_en_tldr_en_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.1736169708012349, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.001996587278110062}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.2912556116042534, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.002623711899034249}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.20072566114135942, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0017824984220287418}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.0384761806811168, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0009080570700775258}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.06572148998847567, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0015105024802730654}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.04387417540357548, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0008841272873745032}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.12265905134544655, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.001362079458617771}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.21240429042053888, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0020452824149258956}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.14291058225462885, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0011859440485204546}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.16352244262880908, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0018872605104035078}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.2749190558193557, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.002492631782723321}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.18905151622482155, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0016692502782787643}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 2.1175282747257644, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.06998742940696125}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b6bc4seed3/evaluation/generation/agg.4b284b6bc4seed3_GEM-wiki_lingua_en_tldr_en_3.json b/4b284b6bc4seed3/evaluation/generation/agg.4b284b6bc4seed3_GEM-wiki_lingua_en_tldr_en_3.json new file mode 100644 index 0000000000000000000000000000000000000000..ca54c36a11b4d3eb4041220120f5186f46123600 --- /dev/null +++ b/4b284b6bc4seed3/evaluation/generation/agg.4b284b6bc4seed3_GEM-wiki_lingua_en_tldr_en_3.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.14882059286798324, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0022373461300931904}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.24050957204964596, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0030817740969047145}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.16643706321643362, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0020704146578302326}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.03181983589104918, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0008484419112906057}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.05484288322789256, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0014960971078962267}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.0361752103611802, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.000867704104426404}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.10654366188722789, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0015926951137942584}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.17705682236326656, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002371382040095437}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.11962154613019327, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0014270812276544398}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.14031012069279475, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0021128033295454685}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.2280011194950691, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.002945699576253965}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.15701568648694605, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.001941607990077885}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 2.1104572563587314, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.08130929312280372}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 3, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b6bc4seed3/evaluation/generation/agg.4b284b6bc4seed3_GEM-wiki_lingua_en_tldr_en_4.json b/4b284b6bc4seed3/evaluation/generation/agg.4b284b6bc4seed3_GEM-wiki_lingua_en_tldr_en_4.json new file mode 100644 index 0000000000000000000000000000000000000000..0a54ee560570b0f2752aff870e6be53b0b9acf93 --- /dev/null +++ b/4b284b6bc4seed3/evaluation/generation/agg.4b284b6bc4seed3_GEM-wiki_lingua_en_tldr_en_4.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.04882282454207474, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0018421430903010254}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.07876047438791374, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.002697214616618726}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.05291772897577509, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0017907780517303251}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.01077293516300109, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0005917384833393335}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.018348282948383934, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0010183488719467035}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.011760404029928792, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0005829032307815198}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.036110109432090025, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.001374477701533682}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.05971330398388186, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0020872379456574647}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.03910342186337772, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0012989884715958904}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.045926119483004395, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0017391323394054688}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.07417627776667039, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0025389281954311367}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.049731919009013095, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0016762102641413167}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 0.4691224289773883, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.02668327939721337}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 4, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b6bc4seed3/evaluation/generation/agg.4b284b6bc4seed3_GEM-wiki_lingua_en_tldr_en_5.json b/4b284b6bc4seed3/evaluation/generation/agg.4b284b6bc4seed3_GEM-wiki_lingua_en_tldr_en_5.json new file mode 100644 index 0000000000000000000000000000000000000000..fa32b2500bef836429ebf4f4f31f7377e3fc5496 --- /dev/null +++ b/4b284b6bc4seed3/evaluation/generation/agg.4b284b6bc4seed3_GEM-wiki_lingua_en_tldr_en_5.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.00810456902224064, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0008295622235488356}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.012892068442699021, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0012439840243997097}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.008433400400641064, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0007845519354746148}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.001717931713356291, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.00023161121403494434}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.0028267780226751624, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.00038800429271119996}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.001800717466655775, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.00022472022265705173}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.0060439886510759554, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.000615759737534485}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.009783049887326086, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0009727833840458493}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.006285400183131738, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0005802251499635472}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.0076696483874971145, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0007904189857688219}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.01212609963804329, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0011678377048075187}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.007924335842795362, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0007327104926757877}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 9.290848886467249e-07, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 1.7114521557633313e-06}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 5, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b6bc4seed3/evaluation/generation/agg.4b284b6bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_0.json b/4b284b6bc4seed3/evaluation/generation/agg.4b284b6bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_0.json new file mode 100644 index 0000000000000000000000000000000000000000..7824b7a57e84d2f3467675996ee901c8d4a27d5b --- /dev/null +++ b/4b284b6bc4seed3/evaluation/generation/agg.4b284b6bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 1.2766060742328618, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.033382297496973044}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.12547708059065077, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0016991149775388303}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.23286096473540036, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.002096871122935081}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.15467556742530433, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0014870962026354128}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.020679772826704766, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0006689218506654367}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.03586683743869036, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0008739755877011557}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.024539136332226045, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0006053943117133528}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.1237352883610742, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0015822386288611187}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.23190983665582457, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0020952712936508694}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.1535691608718009, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0014593610156894993}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.09629626695764527, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.001458815570353432}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.17660986438802767, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.001647260183147006}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.11750764811037896, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0011824353244648067}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b6bc4seed3/evaluation/generation/agg.4b284b6bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_1.json b/4b284b6bc4seed3/evaluation/generation/agg.4b284b6bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_1.json new file mode 100644 index 0000000000000000000000000000000000000000..59da663e8b45d317e79429e93bf63fa7bc6c6ac6 --- /dev/null +++ b/4b284b6bc4seed3/evaluation/generation/agg.4b284b6bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 9.971524127225308, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.10544280951045465}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.48231110383057557, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0032247228835386517}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.403997228531794, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0028600003192301073}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.4113655457313639, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0022474772878560124}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.2130032822750816, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0023661910744460224}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.17583012878246712, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.001978305147161013}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.1793035326067927, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0018252903214182239}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.3479327379612941, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0027285680175982486}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.28935051237673826, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0022709879114623396}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.29475151710386843, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.001863428554324611}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.39081628521576756, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0029962237793696206}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.3259151337760425, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.002573842992772049}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.33218523237694836, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.002132622458139582}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b6bc4seed3/evaluation/generation/agg.4b284b6bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_2.json b/4b284b6bc4seed3/evaluation/generation/agg.4b284b6bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_2.json new file mode 100644 index 0000000000000000000000000000000000000000..4495a92862b1faeeefbe39007f2cc4b9033b5739 --- /dev/null +++ b/4b284b6bc4seed3/evaluation/generation/agg.4b284b6bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 11.009017189958726, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.11145987575879608}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.5147310358802538, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.003396653197723534}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.41720988690209326, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.002792457559765853}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.43104311865962835, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0021779427028603892}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.24498889329212936, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.002608508121965644}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.19327099949467277, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.001959163536842046}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.2002542357997297, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0017902090129902814}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.36812722202759224, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0029336157567466338}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.2964234427792765, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0022900011257602723}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.30590576351723786, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0018552213291573585}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.416924976940603, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.003204078619564438}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.33621578141510805, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0025598541840636643}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.34760227841277236, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0021182372608920443}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b6bc4seed3/evaluation/generation/agg.4b284b6bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_3.json b/4b284b6bc4seed3/evaluation/generation/agg.4b284b6bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_3.json new file mode 100644 index 0000000000000000000000000000000000000000..852480ae60b1bc3822695021e2fb1a003ad342a9 --- /dev/null +++ b/4b284b6bc4seed3/evaluation/generation/agg.4b284b6bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_3.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 11.37013872681925, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.1248535458793912}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.5262376572196412, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.003314216010987937}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.4203811757292955, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0027242623347569794}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.4382518972315406, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002120900374137443}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.2555054900714246, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0025360200082144213}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.19936173892529557, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.001968228951567367}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.2083080407376916, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0017923004828278104}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.3705189491307532, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0028470148719156275}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.2958881905119737, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0022971405804365535}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.30745568780724575, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0018843522431812505}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.42642680843427827, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.003136183576523699}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.34024569366071405, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.002549897845983359}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.3545216421140483, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.00212376511748824}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 3, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b6bc4seed3/evaluation/generation/agg.4b284b6bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_4.json b/4b284b6bc4seed3/evaluation/generation/agg.4b284b6bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_4.json new file mode 100644 index 0000000000000000000000000000000000000000..9464e2be943b5bc630b56b1a2b2bc235c3318304 --- /dev/null +++ b/4b284b6bc4seed3/evaluation/generation/agg.4b284b6bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_4.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 11.765340533551441, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.1912402786333196}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.5306810580993595, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0033851394123312253}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.42528611686964685, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0026503481090942404}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.44393544366679405, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0021690010152583634}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.260418105723064, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0025790052457071106}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.20445058835077626, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0019669109848647025}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.21381876391107585, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0018342178017127435}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.37225379044451273, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0028559068973251483}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.2989580220460878, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0022621251801345312}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.31075327922766594, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0019052938372683594}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.4312812867418651, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.003185050048493793}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.3457653768297206, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.002509286441413888}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.36042783225590935, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.002153038065829124}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 4, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b6bc4seed3/evaluation/generation/agg.4b284b6bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_5.json b/4b284b6bc4seed3/evaluation/generation/agg.4b284b6bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_5.json new file mode 100644 index 0000000000000000000000000000000000000000..8142e3961e000bbc5b36e6a3e90236134128af6a --- /dev/null +++ b/4b284b6bc4seed3/evaluation/generation/agg.4b284b6bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_5.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 11.642699930069227, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.1665369304874196}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.5325771024895927, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.003324417097878668}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.423375363663033, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.002579776398819506}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.44527849888326165, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.00212920846401032}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.26000882478166104, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0025160583279758833}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.2023827705716057, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0019083505179989817}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.21356366108349217, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0018086595084145472}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.37345338410021045, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0027850387825540343}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.29841219926012585, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0022412056697221224}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.31225656411530295, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0018997774824826212}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.4347592206047231, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.003147641490452167}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.34531753802150883, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.002441753077630109}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.36317108046262075, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0021475431353111018}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 5, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b6bc4seed3/evaluation/generation/agg.4b284b6bc4seed3_gem_xsum_article_DOC_summary_0.json b/4b284b6bc4seed3/evaluation/generation/agg.4b284b6bc4seed3_gem_xsum_article_DOC_summary_0.json new file mode 100644 index 0000000000000000000000000000000000000000..c9fad5c2c6fd63ba3bb17c85924b77c8e78a534a --- /dev/null +++ b/4b284b6bc4seed3/evaluation/generation/agg.4b284b6bc4seed3_gem_xsum_article_DOC_summary_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.1710772835102388, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.002582017048828936}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.3373740585909959, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004318919243908899}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.2156420598991778, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.00263185112572885}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.03815200927229576, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0014072364633565078}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.0786744064818293, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0026804574552702818}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.04884054932435322, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0016585250835702103}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.12754160270794315, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.002011334698725272}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.25334667587072296, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.003450143632066797}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.16101456985244528, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0020610939231262555}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.13385208533719228, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.002070645698817516}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.26848842566929143, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0038523767507661405}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.16981783764753203, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.002226137523389508}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 2.0741395710975095, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.08597567591183493}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b6bc4seed3/evaluation/generation/agg.4b284b6bc4seed3_gem_xsum_article_DOC_summary_1.json b/4b284b6bc4seed3/evaluation/generation/agg.4b284b6bc4seed3_gem_xsum_article_DOC_summary_1.json new file mode 100644 index 0000000000000000000000000000000000000000..4b2354b614acea0ddf6a8e31265de2a67d09af86 --- /dev/null +++ b/4b284b6bc4seed3/evaluation/generation/agg.4b284b6bc4seed3_gem_xsum_article_DOC_summary_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.11227417163381835, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0017039218550246112}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.2797248751495629, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.003968857163602909}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.15837125050520046, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0023055850072850443}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.018669833521043514, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0008449378560881147}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.04827881607393628, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.002284155004021152}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.026630545400190872, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0012106703751066281}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.08743651997872359, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0012692664754791996}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.22012328317880311, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.003179126144947638}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.12365741491966617, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.001744614390045227}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.09091214915987274, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0013821688490987276}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.22855737113252247, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0034018065673890674}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.12855514629984804, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0018970590100685048}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 1.1246061582895406, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.07747059021612675}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b6bc4seed3/evaluation/generation/agg.4b284b6bc4seed3_gem_xsum_article_DOC_summary_2.json b/4b284b6bc4seed3/evaluation/generation/agg.4b284b6bc4seed3_gem_xsum_article_DOC_summary_2.json new file mode 100644 index 0000000000000000000000000000000000000000..2a453351ab3cf5567d50d4abd51bd63a07879c13 --- /dev/null +++ b/4b284b6bc4seed3/evaluation/generation/agg.4b284b6bc4seed3_gem_xsum_article_DOC_summary_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.11250317157809601, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0016800664803736658}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.28113282823526276, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.003945997628456255}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.15883481893910234, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0022699060879070535}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.01896938772049727, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0008643828022382121}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.049173235460005654, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.002268647709705696}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.02705070058613688, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0012259402316261174}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.08821548713657433, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.001257682577357835}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.22267200234218015, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.003150822045727067}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.1248624072282009, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0017218083377439604}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.09143863793787037, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0013675216267640294}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.23035645576125668, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.003395221254818866}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.1293633765948801, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0018724040714540883}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 1.083987545697224, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.0951603405593235}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b6bc4seed3/evaluation/generation/agg.4b284b6bc4seed3_gem_xsum_article_DOC_summary_3.json b/4b284b6bc4seed3/evaluation/generation/agg.4b284b6bc4seed3_gem_xsum_article_DOC_summary_3.json new file mode 100644 index 0000000000000000000000000000000000000000..470e2b318c50f1c653113255483d50c298b61e73 --- /dev/null +++ b/4b284b6bc4seed3/evaluation/generation/agg.4b284b6bc4seed3_gem_xsum_article_DOC_summary_3.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.1135683171554586, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0018252408618523069}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.2733846183658498, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004127294944074159}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.1568851125966369, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0023595898685490934}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.018441537770525027, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0008593607153443226}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.046956157677330496, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0022480399509630807}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.025996659748247403, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.001202554493648326}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.08824288636817447, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0013936029206214834}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.21403488032801135, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0033187592114637225}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.12213531817307888, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.001820148746643857}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.09209123877139916, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0014864917206167194}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.22350234682822415, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.00353686596355823}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.12753462874453708, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.001953792409491164}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 1.0722820327593516, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.09885521374509743}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 3, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b6bc4seed3/evaluation/generation/agg.4b284b6bc4seed3_gem_xsum_article_DOC_summary_4.json b/4b284b6bc4seed3/evaluation/generation/agg.4b284b6bc4seed3_gem_xsum_article_DOC_summary_4.json new file mode 100644 index 0000000000000000000000000000000000000000..6dc68b89ae129cf7b74aa4b05399271e6245ed5c --- /dev/null +++ b/4b284b6bc4seed3/evaluation/generation/agg.4b284b6bc4seed3_gem_xsum_article_DOC_summary_4.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.03474932144936362, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.002201931313691675}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.06689455692536692, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0038788599391435565}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.04186692901767099, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0023656062725519998}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.005643400181474951, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0007048683985523554}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.012053130076333454, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.001283667991361848}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.007066756182933345, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.000727809037435576}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.02758638485788023, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0016907629167725257}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.0531079976861651, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.003067848877689164}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.033123659489118114, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0018362158780032708}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.029084229332332977, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.00179355123233279}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.05597642727155089, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0032615168998855935}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.03498061599676034, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0019684597857678363}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 0.5328790203575752, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.08576903026751956}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 4, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b6bc4seed3/evaluation/generation/agg.4b284b6bc4seed3_gem_xsum_article_DOC_summary_5.json b/4b284b6bc4seed3/evaluation/generation/agg.4b284b6bc4seed3_gem_xsum_article_DOC_summary_5.json new file mode 100644 index 0000000000000000000000000000000000000000..cdbcbecc0e2fac49d466950d0ba299402cdd2345 --- /dev/null +++ b/4b284b6bc4seed3/evaluation/generation/agg.4b284b6bc4seed3_gem_xsum_article_DOC_summary_5.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.002328789088383691, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0006187865720825858}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.00208064502929238, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0005621215174690571}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.002150076877118036, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0005715576930386714}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.00010405105438401775, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 7.357743885200423e-05}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 6.636445315690599e-05, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 4.704542030779156e-05}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 8.081906797549185e-05, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 5.7158807305374844e-05}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.0017927242516879765, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.00047914637491014385}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.0015642137359017942, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.00041540866296455953}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.001640744777975664, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.00043598430281185013}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.0018939725840683842, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0005004552190432495}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.001635109178020478, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.00042818036276967824}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.0017214827651769189, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.00045046792515902423}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 2.2373133015544847e-38, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 2.788714232530993e-33}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 5, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b6bc4seed3/evaluation/generation/examples.4b284b6bc4seed3_GEM-web_nlg_en_PALM_prompt_0.jsonl b/4b284b6bc4seed3/evaluation/generation/examples.4b284b6bc4seed3_GEM-web_nlg_en_PALM_prompt_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..7646f488df9845de8e73821e7ff7a775def91081 --- /dev/null +++ b/4b284b6bc4seed3/evaluation/generation/examples.4b284b6bc4seed3_GEM-web_nlg_en_PALM_prompt_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a91667cd9b8b34601cd7c4fc40743fff58103385e443c633deacd31977a3d647 +size 4115425 diff --git a/4b284b6bc4seed3/evaluation/generation/examples.4b284b6bc4seed3_GEM-web_nlg_en_PALM_prompt_1.jsonl b/4b284b6bc4seed3/evaluation/generation/examples.4b284b6bc4seed3_GEM-web_nlg_en_PALM_prompt_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..d27dc57e1b969a8dc4f98d38f80f633f717b078f --- /dev/null +++ b/4b284b6bc4seed3/evaluation/generation/examples.4b284b6bc4seed3_GEM-web_nlg_en_PALM_prompt_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76d9ba59044e145e0dbe7141c1660cb66ad4be3e6bedc7430274c3314cb8e242 +size 5097851 diff --git a/4b284b6bc4seed3/evaluation/generation/examples.4b284b6bc4seed3_GEM-web_nlg_en_PALM_prompt_2.jsonl b/4b284b6bc4seed3/evaluation/generation/examples.4b284b6bc4seed3_GEM-web_nlg_en_PALM_prompt_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..6a637fb9aab5157812511c2d2544fa3c45e1174e --- /dev/null +++ b/4b284b6bc4seed3/evaluation/generation/examples.4b284b6bc4seed3_GEM-web_nlg_en_PALM_prompt_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:45f191d81964ac74b1d439e39b870db370cb5f1679ddcf8c02f0342bbe682c57 +size 6004731 diff --git a/4b284b6bc4seed3/evaluation/generation/examples.4b284b6bc4seed3_GEM-web_nlg_en_PALM_prompt_3.jsonl b/4b284b6bc4seed3/evaluation/generation/examples.4b284b6bc4seed3_GEM-web_nlg_en_PALM_prompt_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..9fad35afd0ac3774d878b68c1ddd184f03670e15 --- /dev/null +++ b/4b284b6bc4seed3/evaluation/generation/examples.4b284b6bc4seed3_GEM-web_nlg_en_PALM_prompt_3.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:31a7ad04d9dfd5a1e63d4d7b816fefb7b1dfaaa2692836f36f7dd5110950e17a +size 6927875 diff --git a/4b284b6bc4seed3/evaluation/generation/examples.4b284b6bc4seed3_GEM-web_nlg_en_PALM_prompt_4.jsonl b/4b284b6bc4seed3/evaluation/generation/examples.4b284b6bc4seed3_GEM-web_nlg_en_PALM_prompt_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..ac4da9eb722b1190e69158b38885588fecfa5d6f --- /dev/null +++ b/4b284b6bc4seed3/evaluation/generation/examples.4b284b6bc4seed3_GEM-web_nlg_en_PALM_prompt_4.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9973434047f4e02be2c75302ad02763a800729a7a16603453e3fa98eeaed011d +size 7835076 diff --git a/4b284b6bc4seed3/evaluation/generation/examples.4b284b6bc4seed3_GEM-web_nlg_en_PALM_prompt_5.jsonl b/4b284b6bc4seed3/evaluation/generation/examples.4b284b6bc4seed3_GEM-web_nlg_en_PALM_prompt_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..7b405655f8427aa646ebf91cc1f4550104b0d168 --- /dev/null +++ b/4b284b6bc4seed3/evaluation/generation/examples.4b284b6bc4seed3_GEM-web_nlg_en_PALM_prompt_5.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6f264eb4aa696b3f6ced181a1d2a7c6f7138d21e79da8c269c74479e62517ad1 +size 8743234 diff --git a/4b284b6bc4seed3/evaluation/generation/examples.4b284b6bc4seed3_GEM-wiki_lingua_en_tldr_en_0.jsonl b/4b284b6bc4seed3/evaluation/generation/examples.4b284b6bc4seed3_GEM-wiki_lingua_en_tldr_en_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..7c7a52a5ebbe286a8dc8c9950b315bda332b5003 --- /dev/null +++ b/4b284b6bc4seed3/evaluation/generation/examples.4b284b6bc4seed3_GEM-wiki_lingua_en_tldr_en_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fae6af83ffe6dd83fbfca4b598b1fb0645ae4e993f64e929bb3634e537b7018f +size 7696064 diff --git a/4b284b6bc4seed3/evaluation/generation/examples.4b284b6bc4seed3_GEM-wiki_lingua_en_tldr_en_1.jsonl b/4b284b6bc4seed3/evaluation/generation/examples.4b284b6bc4seed3_GEM-wiki_lingua_en_tldr_en_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..6961798a1919e5980144545192d06730b61f2296 --- /dev/null +++ b/4b284b6bc4seed3/evaluation/generation/examples.4b284b6bc4seed3_GEM-wiki_lingua_en_tldr_en_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:92d194cdb9771fb4061929210a8d2fd6a4b9a2a52d10fd874d9d4ec66a281200 +size 13322641 diff --git a/4b284b6bc4seed3/evaluation/generation/examples.4b284b6bc4seed3_GEM-wiki_lingua_en_tldr_en_2.jsonl b/4b284b6bc4seed3/evaluation/generation/examples.4b284b6bc4seed3_GEM-wiki_lingua_en_tldr_en_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..b153fab5b7516d24c7ab0cffc4f27a613c364439 --- /dev/null +++ b/4b284b6bc4seed3/evaluation/generation/examples.4b284b6bc4seed3_GEM-wiki_lingua_en_tldr_en_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1d6a834aebb69cfc4155388e8fb7423e588e7b4f48c79ed980937e8537a23782 +size 18927084 diff --git a/4b284b6bc4seed3/evaluation/generation/examples.4b284b6bc4seed3_GEM-wiki_lingua_en_tldr_en_3.jsonl b/4b284b6bc4seed3/evaluation/generation/examples.4b284b6bc4seed3_GEM-wiki_lingua_en_tldr_en_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..2827e12826f4859918e2000f96095da12d26dde4 --- /dev/null +++ b/4b284b6bc4seed3/evaluation/generation/examples.4b284b6bc4seed3_GEM-wiki_lingua_en_tldr_en_3.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:48d316414907f018ebd9417a02c4d8cb0b4f4543b54acc607043e706a41b27d1 +size 24340375 diff --git a/4b284b6bc4seed3/evaluation/generation/examples.4b284b6bc4seed3_GEM-wiki_lingua_en_tldr_en_4.jsonl b/4b284b6bc4seed3/evaluation/generation/examples.4b284b6bc4seed3_GEM-wiki_lingua_en_tldr_en_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..385e565f2bfbb1b0072383e6eb22a660747f2647 --- /dev/null +++ b/4b284b6bc4seed3/evaluation/generation/examples.4b284b6bc4seed3_GEM-wiki_lingua_en_tldr_en_4.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a81f9fed31114f466282037569235e2e7bc69da4860240455827f21a6f7d3fb +size 29476371 diff --git a/4b284b6bc4seed3/evaluation/generation/examples.4b284b6bc4seed3_GEM-wiki_lingua_en_tldr_en_5.jsonl b/4b284b6bc4seed3/evaluation/generation/examples.4b284b6bc4seed3_GEM-wiki_lingua_en_tldr_en_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..68e52f45e29d0fe0a39431e93da865d97e9266e6 --- /dev/null +++ b/4b284b6bc4seed3/evaluation/generation/examples.4b284b6bc4seed3_GEM-wiki_lingua_en_tldr_en_5.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:929a58be740ffd6377e0682e98af2c42728bd79e3ea6342f2d54b32cb8c1698f +size 34800534 diff --git a/4b284b6bc4seed3/evaluation/generation/examples.4b284b6bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl b/4b284b6bc4seed3/evaluation/generation/examples.4b284b6bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..f9ad96ad61ef375983198b1d964aa550b2ffd8a9 --- /dev/null +++ b/4b284b6bc4seed3/evaluation/generation/examples.4b284b6bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e44e7025955fb569b21b8288e8433f54a207ccb64871d9614078ae7c4941d1f9 +size 4482416 diff --git a/4b284b6bc4seed3/evaluation/generation/examples.4b284b6bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl b/4b284b6bc4seed3/evaluation/generation/examples.4b284b6bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..e7feb19bda98b8dabc76e1894562255b41985ab0 --- /dev/null +++ b/4b284b6bc4seed3/evaluation/generation/examples.4b284b6bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a96f686e36aec61c59189384b61c941d655f1bb6e514407821b0f8bf3a2bb4f9 +size 5070189 diff --git a/4b284b6bc4seed3/evaluation/generation/examples.4b284b6bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl b/4b284b6bc4seed3/evaluation/generation/examples.4b284b6bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..92e7f41b5e6c3daed7165be54e1e4c1ec96db9bf --- /dev/null +++ b/4b284b6bc4seed3/evaluation/generation/examples.4b284b6bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4880e058d052caf0b0c7251f1bfc7690c14edbf39a1a08ace549a446042045fa +size 6148272 diff --git a/4b284b6bc4seed3/evaluation/generation/examples.4b284b6bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl b/4b284b6bc4seed3/evaluation/generation/examples.4b284b6bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..d2761788684fbe4305afe76a6daffe8747fef649 --- /dev/null +++ b/4b284b6bc4seed3/evaluation/generation/examples.4b284b6bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:130878d5f643963927ddcfcf892e3ced10caa99a0ca77d677a8a553a2c3e3c4e +size 7226358 diff --git a/4b284b6bc4seed3/evaluation/generation/examples.4b284b6bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl b/4b284b6bc4seed3/evaluation/generation/examples.4b284b6bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..c3905f419b6bf89684b4403ffafcfda502b6809b --- /dev/null +++ b/4b284b6bc4seed3/evaluation/generation/examples.4b284b6bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:43b1d7656317ea53a17e9f99f9b6c5dfba5ac77190a7a89d97d984f5c67579b5 +size 8308651 diff --git a/4b284b6bc4seed3/evaluation/generation/examples.4b284b6bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl b/4b284b6bc4seed3/evaluation/generation/examples.4b284b6bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..59999aab82e560214177eec9f86975c06243add5 --- /dev/null +++ b/4b284b6bc4seed3/evaluation/generation/examples.4b284b6bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fa621b8bf84f120c90c33a81aa99fcc91262cac954018e16d99aa1ffdf6ab4c7 +size 9389406 diff --git a/4b284b6bc4seed3/evaluation/generation/examples.4b284b6bc4seed3_gem_xsum_article_DOC_summary_0.jsonl b/4b284b6bc4seed3/evaluation/generation/examples.4b284b6bc4seed3_gem_xsum_article_DOC_summary_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..33868dc1dc7b39e76748d7839ba86181042b69b2 --- /dev/null +++ b/4b284b6bc4seed3/evaluation/generation/examples.4b284b6bc4seed3_gem_xsum_article_DOC_summary_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a04440c8b76bcdeb90ca2321cb2b1a121ab8522ff18b9e79f4d329d1475e538e +size 2791379 diff --git a/4b284b6bc4seed3/evaluation/generation/examples.4b284b6bc4seed3_gem_xsum_article_DOC_summary_1.jsonl b/4b284b6bc4seed3/evaluation/generation/examples.4b284b6bc4seed3_gem_xsum_article_DOC_summary_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..da54879adac914873a1b41eb7df7c2d7e8f3046a --- /dev/null +++ b/4b284b6bc4seed3/evaluation/generation/examples.4b284b6bc4seed3_gem_xsum_article_DOC_summary_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:20ea2928743e30711bb78c3ab8f3dd6212a121dc815ca814ab715f6b002d128c +size 5103838 diff --git a/4b284b6bc4seed3/evaluation/generation/examples.4b284b6bc4seed3_gem_xsum_article_DOC_summary_2.jsonl b/4b284b6bc4seed3/evaluation/generation/examples.4b284b6bc4seed3_gem_xsum_article_DOC_summary_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..81931b42cfe6033db8472bbafbc4a70dbc82c3f4 --- /dev/null +++ b/4b284b6bc4seed3/evaluation/generation/examples.4b284b6bc4seed3_gem_xsum_article_DOC_summary_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:151519cf82cf75a485e84eb73f789a17384b13a706666903cbd56d67c5216a6f +size 7377069 diff --git a/4b284b6bc4seed3/evaluation/generation/examples.4b284b6bc4seed3_gem_xsum_article_DOC_summary_3.jsonl b/4b284b6bc4seed3/evaluation/generation/examples.4b284b6bc4seed3_gem_xsum_article_DOC_summary_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..fdad404b65dfd9cd3cd770665b21fc5cda78c6dd --- /dev/null +++ b/4b284b6bc4seed3/evaluation/generation/examples.4b284b6bc4seed3_gem_xsum_article_DOC_summary_3.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a344e487d9791014a508874a83209215bbec34c6c1259181c1ae7f449c884eaa +size 9645108 diff --git a/4b284b6bc4seed3/evaluation/generation/examples.4b284b6bc4seed3_gem_xsum_article_DOC_summary_4.jsonl b/4b284b6bc4seed3/evaluation/generation/examples.4b284b6bc4seed3_gem_xsum_article_DOC_summary_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..f9454f4e5623b37b177ca19037a788f281030df1 --- /dev/null +++ b/4b284b6bc4seed3/evaluation/generation/examples.4b284b6bc4seed3_gem_xsum_article_DOC_summary_4.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:73396bce875baf0ec0d9922b0ec4acacf9392334d9bf77ccf79437205aae9294 +size 11671556 diff --git a/4b284b6bc4seed3/evaluation/generation/examples.4b284b6bc4seed3_gem_xsum_article_DOC_summary_5.jsonl b/4b284b6bc4seed3/evaluation/generation/examples.4b284b6bc4seed3_gem_xsum_article_DOC_summary_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..045c8df8faf11e55320979ead8a7190a46c14eaa --- /dev/null +++ b/4b284b6bc4seed3/evaluation/generation/examples.4b284b6bc4seed3_gem_xsum_article_DOC_summary_5.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5155233d1f1c8b188f4477c3bc73d1f3e40e217482f8986e4a452642b0408834 +size 13897529 diff --git a/4b284b6bc4seed3/evaluation/generation/merged.csv b/4b284b6bc4seed3/evaluation/generation/merged.csv new file mode 100644 index 0000000000000000000000000000000000000000..f1f864ec09eb230fde8f4139aa039e9634449776 --- /dev/null +++ b/4b284b6bc4seed3/evaluation/generation/merged.csv @@ -0,0 +1,53 @@ +dataset,fewshots,prompt,metric,value +e2e_nlg_cleaned,0,generate_text_restaurant,rouge2_fmeasure,0.024539136332226045 +e2e_nlg_cleaned,0,median,rouge2_fmeasure,0.024539136332226045 +e2e_nlg_cleaned,1,generate_text_restaurant,rouge2_fmeasure,0.1793035326067927 +e2e_nlg_cleaned,1,median,rouge2_fmeasure,0.1793035326067927 +e2e_nlg_cleaned,2,generate_text_restaurant,rouge2_fmeasure,0.2002542357997297 +e2e_nlg_cleaned,2,median,rouge2_fmeasure,0.2002542357997297 +e2e_nlg_cleaned,3,generate_text_restaurant,rouge2_fmeasure,0.2083080407376916 +e2e_nlg_cleaned,3,median,rouge2_fmeasure,0.2083080407376916 +e2e_nlg_cleaned,4,generate_text_restaurant,rouge2_fmeasure,0.21381876391107585 +e2e_nlg_cleaned,4,median,rouge2_fmeasure,0.21381876391107585 +e2e_nlg_cleaned,5,generate_text_restaurant,rouge2_fmeasure,0.21356366108349217 +e2e_nlg_cleaned,5,median,rouge2_fmeasure,0.21356366108349217 +e2e_nlg_cleaned,5,average,multiple,0.17329789507850135 +gem_xsum,0,article_DOC_summary,rouge2_fmeasure,0.04884054932435322 +gem_xsum,0,median,rouge2_fmeasure,0.04884054932435322 +gem_xsum,1,article_DOC_summary,rouge2_fmeasure,0.026630545400190872 +gem_xsum,1,median,rouge2_fmeasure,0.026630545400190872 +gem_xsum,2,article_DOC_summary,rouge2_fmeasure,0.02705070058613688 +gem_xsum,2,median,rouge2_fmeasure,0.02705070058613688 +gem_xsum,3,article_DOC_summary,rouge2_fmeasure,0.025996659748247403 +gem_xsum,3,median,rouge2_fmeasure,0.025996659748247403 +gem_xsum,4,article_DOC_summary,rouge2_fmeasure,0.007066756182933345 +gem_xsum,4,median,rouge2_fmeasure,0.007066756182933345 +gem_xsum,5,article_DOC_summary,rouge2_fmeasure,8.081906797549185e-05 +gem_xsum,5,median,rouge2_fmeasure,8.081906797549185e-05 +gem_xsum,5,average,multiple,0.022611005051639536 +web_nlg_en,0,PALM_prompt,rouge2_fmeasure,0.05063701387421738 +web_nlg_en,0,median,rouge2_fmeasure,0.05063701387421738 +web_nlg_en,1,PALM_prompt,rouge2_fmeasure,0.05068936829455799 +web_nlg_en,1,median,rouge2_fmeasure,0.05068936829455799 +web_nlg_en,2,PALM_prompt,rouge2_fmeasure,0.051840665529172124 +web_nlg_en,2,median,rouge2_fmeasure,0.051840665529172124 +web_nlg_en,3,PALM_prompt,rouge2_fmeasure,0.05316112071013902 +web_nlg_en,3,median,rouge2_fmeasure,0.05316112071013902 +web_nlg_en,4,PALM_prompt,rouge2_fmeasure,0.05290384691957595 +web_nlg_en,4,median,rouge2_fmeasure,0.05290384691957595 +web_nlg_en,5,PALM_prompt,rouge2_fmeasure,0.053092972525274194 +web_nlg_en,5,median,rouge2_fmeasure,0.053092972525274194 +web_nlg_en,5,average,multiple,0.052054164642156106 +wiki_lingua_en,0,tldr_en,rouge2_fmeasure,0.0367425698800636 +wiki_lingua_en,0,median,rouge2_fmeasure,0.0367425698800636 +wiki_lingua_en,1,tldr_en,rouge2_fmeasure,0.041911863785581135 +wiki_lingua_en,1,median,rouge2_fmeasure,0.041911863785581135 +wiki_lingua_en,2,tldr_en,rouge2_fmeasure,0.04387417540357548 +wiki_lingua_en,2,median,rouge2_fmeasure,0.04387417540357548 +wiki_lingua_en,3,tldr_en,rouge2_fmeasure,0.0361752103611802 +wiki_lingua_en,3,median,rouge2_fmeasure,0.0361752103611802 +wiki_lingua_en,4,tldr_en,rouge2_fmeasure,0.011760404029928792 +wiki_lingua_en,4,median,rouge2_fmeasure,0.011760404029928792 +wiki_lingua_en,5,tldr_en,rouge2_fmeasure,0.001800717466655775 +wiki_lingua_en,5,median,rouge2_fmeasure,0.001800717466655775 +wiki_lingua_en,5,average,multiple,0.02871082348783083 diff --git a/4b284b6bc4seed3/evaluation/generation/merged.json b/4b284b6bc4seed3/evaluation/generation/merged.json new file mode 100644 index 0000000000000000000000000000000000000000..cb75966bd9d2a5e7385012fcc436fa94b39d1130 --- /dev/null +++ b/4b284b6bc4seed3/evaluation/generation/merged.json @@ -0,0 +1 @@ +{"GEM/web_nlg_en": {"0": {"PALM_prompt": {"bleu": 0.32969762409287173, "bleu_stderr": 0.03350207893898449, "rouge1_fmeasure": 0.10919706809885917, "rouge1_fmeasure_stderr": 0.0021601422959730493, "rouge1_precision": 0.07489491650147996, "rouge1_precision_stderr": 0.001916354345656983, "rouge1_recall": 0.300291813063712, "rouge1_recall_stderr": 0.00461536297454604, "rouge2_fmeasure": 0.05063701387421738, "rouge2_fmeasure_stderr": 0.0013546648556391975, "rouge2_precision": 0.03439062652684824, "rouge2_precision_stderr": 0.0011545837032529334, "rouge2_recall": 0.14370713443920666, "rouge2_recall_stderr": 0.003246173363178369, "rougeL_fmeasure": 0.10382750267360731, "rougeL_fmeasure_stderr": 0.0019706115754186356, "rougeL_precision": 0.07070012219921042, "rougeL_precision_stderr": 0.0017208007855753348, "rougeL_recall": 0.2895484949203548, "rougeL_recall_stderr": 0.0044970181242023404, "rougeLsum_fmeasure": 0.10361568313155001, "rougeLsum_fmeasure_stderr": 0.002010621664327297, "rougeLsum_precision": 0.07104242339944349, "rougeLsum_precision_stderr": 0.0017912432501280336, "rougeLsum_recall": 0.2857359841499445, "rougeLsum_recall_stderr": 0.004341838499174088}}, "1": {"PALM_prompt": {"bleu": 0.4359939783272789, "bleu_stderr": 0.041779670416334125, "rouge1_fmeasure": 0.11088292832283875, "rouge1_fmeasure_stderr": 0.0019702183179370605, "rouge1_precision": 0.07266279503165236, "rouge1_precision_stderr": 0.0017099935201375816, "rouge1_recall": 0.3475964219389317, "rouge1_recall_stderr": 0.00506748933764113, "rouge2_fmeasure": 0.05068936829455799, "rouge2_fmeasure_stderr": 0.0012538981392173827, "rouge2_precision": 0.03335287604120367, "rouge2_precision_stderr": 0.001128095255122388, "rouge2_recall": 0.1660344328298045, "rouge2_recall_stderr": 0.0035028476813622595, "rougeL_fmeasure": 0.10353647374043018, "rougeL_fmeasure_stderr": 0.0017861554904427183, "rougeL_precision": 0.06772928954103168, "rougeL_precision_stderr": 0.0015712765252988345, "rougeL_recall": 0.3260811514542075, "rougeL_recall_stderr": 0.004710148749523479, "rougeLsum_fmeasure": 0.1047015599685259, "rougeLsum_fmeasure_stderr": 0.0018609963369853742, "rougeLsum_precision": 0.06867664726380934, "rougeLsum_precision_stderr": 0.0016318384908350385, "rougeLsum_recall": 0.32775048198841006, "rougeLsum_recall_stderr": 0.0046848102542069335}}, "2": {"PALM_prompt": {"bleu": 0.5047753641043208, "bleu_stderr": 0.03242172296180824, "rouge1_fmeasure": 0.1150888371627504, "rouge1_fmeasure_stderr": 0.0018709716201208576, "rouge1_precision": 0.07334706790054754, "rouge1_precision_stderr": 0.0013930615456138227, "rouge1_recall": 0.3737700063497622, "rouge1_recall_stderr": 0.005196576717483812, "rouge2_fmeasure": 0.051840665529172124, "rouge2_fmeasure_stderr": 0.0011509985318477927, "rouge2_precision": 0.032868072571177076, "rouge2_precision_stderr": 0.000815253916940581, "rouge2_recall": 0.17803179222143828, "rouge2_recall_stderr": 0.003604190340424885, "rougeL_fmeasure": 0.10581169764988507, "rougeL_fmeasure_stderr": 0.0016601816301532264, "rougeL_precision": 0.06734503744998965, "rougeL_precision_stderr": 0.001233876908858107, "rougeL_recall": 0.3449240970361082, "rougeL_recall_stderr": 0.004694373882052961, "rougeLsum_fmeasure": 0.10857869554945465, "rougeLsum_fmeasure_stderr": 0.0017505188501646559, "rougeLsum_precision": 0.06919868166026465, "rougeLsum_precision_stderr": 0.0013042029174787707, "rougeLsum_recall": 0.3526754078681369, "rougeLsum_recall_stderr": 0.004836506777085055}}, "3": {"PALM_prompt": {"bleu": 0.6249385322673848, "bleu_stderr": 0.023211819786736334, "rouge1_fmeasure": 0.11637468420417033, "rouge1_fmeasure_stderr": 0.0018331195406713198, "rouge1_precision": 0.07372614912850947, "rouge1_precision_stderr": 0.001359300603084539, "rouge1_recall": 0.3888611122018525, "rouge1_recall_stderr": 0.0053578637277047906, "rouge2_fmeasure": 0.05316112071013902, "rouge2_fmeasure_stderr": 0.0011465281622819825, "rouge2_precision": 0.033416989091581, "rouge2_precision_stderr": 0.0008041939460804035, "rouge2_recall": 0.1903256864921483, "rouge2_recall_stderr": 0.0038053895221829945, "rougeL_fmeasure": 0.10582598758235875, "rougeL_fmeasure_stderr": 0.0016101686735076229, "rougeL_precision": 0.06697897307455199, "rougeL_precision_stderr": 0.0011891190081388082, "rougeL_recall": 0.3547382398864492, "rougeL_recall_stderr": 0.004815238098721177, "rougeLsum_fmeasure": 0.10953693694712942, "rougeLsum_fmeasure_stderr": 0.0017209757445741357, "rougeLsum_precision": 0.0694765908871884, "rougeLsum_precision_stderr": 0.0012821064008090915, "rougeLsum_recall": 0.364488357943653, "rougeLsum_recall_stderr": 0.0048866912766196875}}, "4": {"PALM_prompt": {"bleu": 0.6172877259530323, "bleu_stderr": 0.0352446996928639, "rouge1_fmeasure": 0.1180321735790567, "rouge1_fmeasure_stderr": 0.0018211841415573945, "rouge1_precision": 0.0748843501395415, "rouge1_precision_stderr": 0.001381267162660691, "rouge1_recall": 0.39598227128772256, "rouge1_recall_stderr": 0.00522226055907367, "rouge2_fmeasure": 0.05290384691957595, "rouge2_fmeasure_stderr": 0.0011327428150165345, "rouge2_precision": 0.033363716686448004, "rouge2_precision_stderr": 0.0008232905700585103, "rouge2_recall": 0.18904409931911847, "rouge2_recall_stderr": 0.0036763179024498203, "rougeL_fmeasure": 0.1053542922815303, "rougeL_fmeasure_stderr": 0.0015788673153327966, "rougeL_precision": 0.06681400109757821, "rougeL_precision_stderr": 0.0012097158147883198, "rougeL_recall": 0.3551645214739529, "rougeL_recall_stderr": 0.004603707682826054, "rougeLsum_fmeasure": 0.11042261394743104, "rougeLsum_fmeasure_stderr": 0.001708240502656495, "rougeLsum_precision": 0.07014407223382836, "rougeLsum_precision_stderr": 0.0013067256802706008, "rougeLsum_recall": 0.3699177055550494, "rougeLsum_recall_stderr": 0.0047899231539846945}}, "5": {"PALM_prompt": {"bleu": 0.6739230942233659, "bleu_stderr": 0.03781903865026685, "rouge1_fmeasure": 0.11775202851872192, "rouge1_fmeasure_stderr": 0.0017322424295727937, "rouge1_precision": 0.07434118591062619, "rouge1_precision_stderr": 0.0013606852466120714, "rouge1_recall": 0.40517103911737706, "rouge1_recall_stderr": 0.005207962506245739, "rouge2_fmeasure": 0.053092972525274194, "rouge2_fmeasure_stderr": 0.0010965950400499984, "rouge2_precision": 0.03309571045270455, "rouge2_precision_stderr": 0.000762355738688032, "rouge2_recall": 0.1960621498928731, "rouge2_recall_stderr": 0.0037598520682319884, "rougeL_fmeasure": 0.10543601362203549, "rougeL_fmeasure_stderr": 0.0015178302726180323, "rougeL_precision": 0.06663527060233249, "rougeL_precision_stderr": 0.001226540610105808, "rougeL_recall": 0.3640849747385268, "rougeL_recall_stderr": 0.004640046414372116, "rougeLsum_fmeasure": 0.11016000573694927, "rougeLsum_fmeasure_stderr": 0.0016169723040308337, "rougeLsum_precision": 0.06962894335162277, "rougeLsum_precision_stderr": 0.001291561351449583, "rougeLsum_recall": 0.3794277979681509, "rougeLsum_recall_stderr": 0.004818380083375467}}}, "GEM/wiki_lingua_en": {"0": {"tldr_en": {"bleu": 1.5656365853870153, "bleu_stderr": 0.06994438419251063, "rouge1_fmeasure": 0.18074785424679843, "rouge1_fmeasure_stderr": 0.0018330825958722083, "rouge1_precision": 0.15541888954389302, "rouge1_precision_stderr": 0.0018896399566670286, "rouge1_recall": 0.2609485104955259, "rouge1_recall_stderr": 0.002636869555478932, "rouge2_fmeasure": 0.0367425698800636, "rouge2_fmeasure_stderr": 0.0008312312379815959, "rouge2_precision": 0.031340296740352346, "rouge2_precision_stderr": 0.0007364805410626298, "rouge2_recall": 0.05475940923731912, "rouge2_recall_stderr": 0.0013900561092136223, "rougeL_fmeasure": 0.13925315500169771, "rougeL_fmeasure_stderr": 0.0012900858881895007, "rougeL_precision": 0.11824683156742628, "rougeL_precision_stderr": 0.0012988846637495886, "rougeL_recall": 0.20619299633996296, "rougeL_recall_stderr": 0.00212551360652741, "rougeLsum_fmeasure": 0.1659756245930406, "rougeLsum_fmeasure_stderr": 0.0016665877399642023, "rougeLsum_precision": 0.14243870027384645, "rougeLsum_precision_stderr": 0.0017153432680596468, "rougeLsum_recall": 0.24072866043059984, "rougeLsum_recall_stderr": 0.0024483585527040877}}, "1": {"tldr_en": {"bleu": 1.973383093888403, "bleu_stderr": 0.062022250654948985, "rouge1_fmeasure": 0.19671251716356983, "rouge1_fmeasure_stderr": 0.001845617511049733, "rouge1_precision": 0.16880681390038538, "rouge1_precision_stderr": 0.0019611277767498836, "rouge1_recall": 0.28525722098489775, "rouge1_recall_stderr": 0.002677390028605212, "rouge2_fmeasure": 0.041911863785581135, "rouge2_fmeasure_stderr": 0.0008870741133490255, "rouge2_precision": 0.03604438137203516, "rouge2_precision_stderr": 0.000869171473451728, "rouge2_recall": 0.06302505515896178, "rouge2_recall_stderr": 0.001516286602693054, "rougeL_fmeasure": 0.14075220661179533, "rougeL_fmeasure_stderr": 0.001215604718401757, "rougeL_precision": 0.11944422928337016, "rougeL_precision_stderr": 0.001289252852685886, "rougeL_recall": 0.20967875473639086, "rougeL_recall_stderr": 0.002077526143241249, "rougeLsum_fmeasure": 0.18414503390476486, "rougeLsum_fmeasure_stderr": 0.0017143415167847412, "rougeLsum_precision": 0.15784656842847097, "rougeLsum_precision_stderr": 0.0018258770460077972, "rougeLsum_recall": 0.26803761801382864, "rougeLsum_recall_stderr": 0.002534338768264281}}, "2": {"tldr_en": {"bleu": 2.1175282747257644, "bleu_stderr": 0.06998742940696125, "rouge1_fmeasure": 0.20072566114135942, "rouge1_fmeasure_stderr": 0.0017824984220287418, "rouge1_precision": 0.1736169708012349, "rouge1_precision_stderr": 0.001996587278110062, "rouge1_recall": 0.2912556116042534, "rouge1_recall_stderr": 0.002623711899034249, "rouge2_fmeasure": 0.04387417540357548, "rouge2_fmeasure_stderr": 0.0008841272873745032, "rouge2_precision": 0.0384761806811168, "rouge2_precision_stderr": 0.0009080570700775258, "rouge2_recall": 0.06572148998847567, "rouge2_recall_stderr": 0.0015105024802730654, "rougeL_fmeasure": 0.14291058225462885, "rougeL_fmeasure_stderr": 0.0011859440485204546, "rougeL_precision": 0.12265905134544655, "rougeL_precision_stderr": 0.001362079458617771, "rougeL_recall": 0.21240429042053888, "rougeL_recall_stderr": 0.0020452824149258956, "rougeLsum_fmeasure": 0.18905151622482155, "rougeLsum_fmeasure_stderr": 0.0016692502782787643, "rougeLsum_precision": 0.16352244262880908, "rougeLsum_precision_stderr": 0.0018872605104035078, "rougeLsum_recall": 0.2749190558193557, "rougeLsum_recall_stderr": 0.002492631782723321}}, "3": {"tldr_en": {"bleu": 2.1104572563587314, "bleu_stderr": 0.08130929312280372, "rouge1_fmeasure": 0.16643706321643362, "rouge1_fmeasure_stderr": 0.0020704146578302326, "rouge1_precision": 0.14882059286798324, "rouge1_precision_stderr": 0.0022373461300931904, "rouge1_recall": 0.24050957204964596, "rouge1_recall_stderr": 0.0030817740969047145, "rouge2_fmeasure": 0.0361752103611802, "rouge2_fmeasure_stderr": 0.000867704104426404, "rouge2_precision": 0.03181983589104918, "rouge2_precision_stderr": 0.0008484419112906057, "rouge2_recall": 0.05484288322789256, "rouge2_recall_stderr": 0.0014960971078962267, "rougeL_fmeasure": 0.11962154613019327, "rougeL_fmeasure_stderr": 0.0014270812276544398, "rougeL_precision": 0.10654366188722789, "rougeL_precision_stderr": 0.0015926951137942584, "rougeL_recall": 0.17705682236326656, "rougeL_recall_stderr": 0.002371382040095437, "rougeLsum_fmeasure": 0.15701568648694605, "rougeLsum_fmeasure_stderr": 0.001941607990077885, "rougeLsum_precision": 0.14031012069279475, "rougeLsum_precision_stderr": 0.0021128033295454685, "rougeLsum_recall": 0.2280011194950691, "rougeLsum_recall_stderr": 0.002945699576253965}}, "4": {"tldr_en": {"bleu": 0.4691224289773883, "bleu_stderr": 0.02668327939721337, "rouge1_fmeasure": 0.05291772897577509, "rouge1_fmeasure_stderr": 0.0017907780517303251, "rouge1_precision": 0.04882282454207474, "rouge1_precision_stderr": 0.0018421430903010254, "rouge1_recall": 0.07876047438791374, "rouge1_recall_stderr": 0.002697214616618726, "rouge2_fmeasure": 0.011760404029928792, "rouge2_fmeasure_stderr": 0.0005829032307815198, "rouge2_precision": 0.01077293516300109, "rouge2_precision_stderr": 0.0005917384833393335, "rouge2_recall": 0.018348282948383934, "rouge2_recall_stderr": 0.0010183488719467035, "rougeL_fmeasure": 0.03910342186337772, "rougeL_fmeasure_stderr": 0.0012989884715958904, "rougeL_precision": 0.036110109432090025, "rougeL_precision_stderr": 0.001374477701533682, "rougeL_recall": 0.05971330398388186, "rougeL_recall_stderr": 0.0020872379456574647, "rougeLsum_fmeasure": 0.049731919009013095, "rougeLsum_fmeasure_stderr": 0.0016762102641413167, "rougeLsum_precision": 0.045926119483004395, "rougeLsum_precision_stderr": 0.0017391323394054688, "rougeLsum_recall": 0.07417627776667039, "rougeLsum_recall_stderr": 0.0025389281954311367}}, "5": {"tldr_en": {"bleu": 9.290848886467249e-07, "bleu_stderr": 1.7114521557633313e-06, "rouge1_fmeasure": 0.008433400400641064, "rouge1_fmeasure_stderr": 0.0007845519354746148, "rouge1_precision": 0.00810456902224064, "rouge1_precision_stderr": 0.0008295622235488356, "rouge1_recall": 0.012892068442699021, "rouge1_recall_stderr": 0.0012439840243997097, "rouge2_fmeasure": 0.001800717466655775, "rouge2_fmeasure_stderr": 0.00022472022265705173, "rouge2_precision": 0.001717931713356291, "rouge2_precision_stderr": 0.00023161121403494434, "rouge2_recall": 0.0028267780226751624, "rouge2_recall_stderr": 0.00038800429271119996, "rougeL_fmeasure": 0.006285400183131738, "rougeL_fmeasure_stderr": 0.0005802251499635472, "rougeL_precision": 0.0060439886510759554, "rougeL_precision_stderr": 0.000615759737534485, "rougeL_recall": 0.009783049887326086, "rougeL_recall_stderr": 0.0009727833840458493, "rougeLsum_fmeasure": 0.007924335842795362, "rougeLsum_fmeasure_stderr": 0.0007327104926757877, "rougeLsum_precision": 0.0076696483874971145, "rougeLsum_precision_stderr": 0.0007904189857688219, "rougeLsum_recall": 0.01212609963804329, "rougeLsum_recall_stderr": 0.0011678377048075187}}}, "e2e_nlg_cleaned": {"0": {"generate_text_restaurant": {"bleu": 1.2766060742328618, "bleu_stderr": 0.033382297496973044, "rouge1_fmeasure": 0.15467556742530433, "rouge1_fmeasure_stderr": 0.0014870962026354128, "rouge1_precision": 0.12547708059065077, "rouge1_precision_stderr": 0.0016991149775388303, "rouge1_recall": 0.23286096473540036, "rouge1_recall_stderr": 0.002096871122935081, "rouge2_fmeasure": 0.024539136332226045, "rouge2_fmeasure_stderr": 0.0006053943117133528, "rouge2_precision": 0.020679772826704766, "rouge2_precision_stderr": 0.0006689218506654367, "rouge2_recall": 0.03586683743869036, "rouge2_recall_stderr": 0.0008739755877011557, "rougeL_fmeasure": 0.1535691608718009, "rougeL_fmeasure_stderr": 0.0014593610156894993, "rougeL_precision": 0.1237352883610742, "rougeL_precision_stderr": 0.0015822386288611187, "rougeL_recall": 0.23190983665582457, "rougeL_recall_stderr": 0.0020952712936508694, "rougeLsum_fmeasure": 0.11750764811037896, "rougeLsum_fmeasure_stderr": 0.0011824353244648067, "rougeLsum_precision": 0.09629626695764527, "rougeLsum_precision_stderr": 0.001458815570353432, "rougeLsum_recall": 0.17660986438802767, "rougeLsum_recall_stderr": 0.001647260183147006}}, "1": {"generate_text_restaurant": {"bleu": 9.971524127225308, "bleu_stderr": 0.10544280951045465, "rouge1_fmeasure": 0.4113655457313639, "rouge1_fmeasure_stderr": 0.0022474772878560124, "rouge1_precision": 0.48231110383057557, "rouge1_precision_stderr": 0.0032247228835386517, "rouge1_recall": 0.403997228531794, "rouge1_recall_stderr": 0.0028600003192301073, "rouge2_fmeasure": 0.1793035326067927, "rouge2_fmeasure_stderr": 0.0018252903214182239, "rouge2_precision": 0.2130032822750816, "rouge2_precision_stderr": 0.0023661910744460224, "rouge2_recall": 0.17583012878246712, "rouge2_recall_stderr": 0.001978305147161013, "rougeL_fmeasure": 0.29475151710386843, "rougeL_fmeasure_stderr": 0.001863428554324611, "rougeL_precision": 0.3479327379612941, "rougeL_precision_stderr": 0.0027285680175982486, "rougeL_recall": 0.28935051237673826, "rougeL_recall_stderr": 0.0022709879114623396, "rougeLsum_fmeasure": 0.33218523237694836, "rougeLsum_fmeasure_stderr": 0.002132622458139582, "rougeLsum_precision": 0.39081628521576756, "rougeLsum_precision_stderr": 0.0029962237793696206, "rougeLsum_recall": 0.3259151337760425, "rougeLsum_recall_stderr": 0.002573842992772049}}, "2": {"generate_text_restaurant": {"bleu": 11.009017189958726, "bleu_stderr": 0.11145987575879608, "rouge1_fmeasure": 0.43104311865962835, "rouge1_fmeasure_stderr": 0.0021779427028603892, "rouge1_precision": 0.5147310358802538, "rouge1_precision_stderr": 0.003396653197723534, "rouge1_recall": 0.41720988690209326, "rouge1_recall_stderr": 0.002792457559765853, "rouge2_fmeasure": 0.2002542357997297, "rouge2_fmeasure_stderr": 0.0017902090129902814, "rouge2_precision": 0.24498889329212936, "rouge2_precision_stderr": 0.002608508121965644, "rouge2_recall": 0.19327099949467277, "rouge2_recall_stderr": 0.001959163536842046, "rougeL_fmeasure": 0.30590576351723786, "rougeL_fmeasure_stderr": 0.0018552213291573585, "rougeL_precision": 0.36812722202759224, "rougeL_precision_stderr": 0.0029336157567466338, "rougeL_recall": 0.2964234427792765, "rougeL_recall_stderr": 0.0022900011257602723, "rougeLsum_fmeasure": 0.34760227841277236, "rougeLsum_fmeasure_stderr": 0.0021182372608920443, "rougeLsum_precision": 0.416924976940603, "rougeLsum_precision_stderr": 0.003204078619564438, "rougeLsum_recall": 0.33621578141510805, "rougeLsum_recall_stderr": 0.0025598541840636643}}, "3": {"generate_text_restaurant": {"bleu": 11.37013872681925, "bleu_stderr": 0.1248535458793912, "rouge1_fmeasure": 0.4382518972315406, "rouge1_fmeasure_stderr": 0.002120900374137443, "rouge1_precision": 0.5262376572196412, "rouge1_precision_stderr": 0.003314216010987937, "rouge1_recall": 0.4203811757292955, "rouge1_recall_stderr": 0.0027242623347569794, "rouge2_fmeasure": 0.2083080407376916, "rouge2_fmeasure_stderr": 0.0017923004828278104, "rouge2_precision": 0.2555054900714246, "rouge2_precision_stderr": 0.0025360200082144213, "rouge2_recall": 0.19936173892529557, "rouge2_recall_stderr": 0.001968228951567367, "rougeL_fmeasure": 0.30745568780724575, "rougeL_fmeasure_stderr": 0.0018843522431812505, "rougeL_precision": 0.3705189491307532, "rougeL_precision_stderr": 0.0028470148719156275, "rougeL_recall": 0.2958881905119737, "rougeL_recall_stderr": 0.0022971405804365535, "rougeLsum_fmeasure": 0.3545216421140483, "rougeLsum_fmeasure_stderr": 0.00212376511748824, "rougeLsum_precision": 0.42642680843427827, "rougeLsum_precision_stderr": 0.003136183576523699, "rougeLsum_recall": 0.34024569366071405, "rougeLsum_recall_stderr": 0.002549897845983359}}, "4": {"generate_text_restaurant": {"bleu": 11.765340533551441, "bleu_stderr": 0.1912402786333196, "rouge1_fmeasure": 0.44393544366679405, "rouge1_fmeasure_stderr": 0.0021690010152583634, "rouge1_precision": 0.5306810580993595, "rouge1_precision_stderr": 0.0033851394123312253, "rouge1_recall": 0.42528611686964685, "rouge1_recall_stderr": 0.0026503481090942404, "rouge2_fmeasure": 0.21381876391107585, "rouge2_fmeasure_stderr": 0.0018342178017127435, "rouge2_precision": 0.260418105723064, "rouge2_precision_stderr": 0.0025790052457071106, "rouge2_recall": 0.20445058835077626, "rouge2_recall_stderr": 0.0019669109848647025, "rougeL_fmeasure": 0.31075327922766594, "rougeL_fmeasure_stderr": 0.0019052938372683594, "rougeL_precision": 0.37225379044451273, "rougeL_precision_stderr": 0.0028559068973251483, "rougeL_recall": 0.2989580220460878, "rougeL_recall_stderr": 0.0022621251801345312, "rougeLsum_fmeasure": 0.36042783225590935, "rougeLsum_fmeasure_stderr": 0.002153038065829124, "rougeLsum_precision": 0.4312812867418651, "rougeLsum_precision_stderr": 0.003185050048493793, "rougeLsum_recall": 0.3457653768297206, "rougeLsum_recall_stderr": 0.002509286441413888}}, "5": {"generate_text_restaurant": {"bleu": 11.642699930069227, "bleu_stderr": 0.1665369304874196, "rouge1_fmeasure": 0.44527849888326165, "rouge1_fmeasure_stderr": 0.00212920846401032, "rouge1_precision": 0.5325771024895927, "rouge1_precision_stderr": 0.003324417097878668, "rouge1_recall": 0.423375363663033, "rouge1_recall_stderr": 0.002579776398819506, "rouge2_fmeasure": 0.21356366108349217, "rouge2_fmeasure_stderr": 0.0018086595084145472, "rouge2_precision": 0.26000882478166104, "rouge2_precision_stderr": 0.0025160583279758833, "rouge2_recall": 0.2023827705716057, "rouge2_recall_stderr": 0.0019083505179989817, "rougeL_fmeasure": 0.31225656411530295, "rougeL_fmeasure_stderr": 0.0018997774824826212, "rougeL_precision": 0.37345338410021045, "rougeL_precision_stderr": 0.0027850387825540343, "rougeL_recall": 0.29841219926012585, "rougeL_recall_stderr": 0.0022412056697221224, "rougeLsum_fmeasure": 0.36317108046262075, "rougeLsum_fmeasure_stderr": 0.0021475431353111018, "rougeLsum_precision": 0.4347592206047231, "rougeLsum_precision_stderr": 0.003147641490452167, "rougeLsum_recall": 0.34531753802150883, "rougeLsum_recall_stderr": 0.002441753077630109}}}, "gem_xsum": {"0": {"article_DOC_summary": {"bleu": 2.0741395710975095, "bleu_stderr": 0.08597567591183493, "rouge1_fmeasure": 0.2156420598991778, "rouge1_fmeasure_stderr": 0.00263185112572885, "rouge1_precision": 0.1710772835102388, "rouge1_precision_stderr": 0.002582017048828936, "rouge1_recall": 0.3373740585909959, "rouge1_recall_stderr": 0.004318919243908899, "rouge2_fmeasure": 0.04884054932435322, "rouge2_fmeasure_stderr": 0.0016585250835702103, "rouge2_precision": 0.03815200927229576, "rouge2_precision_stderr": 0.0014072364633565078, "rouge2_recall": 0.0786744064818293, "rouge2_recall_stderr": 0.0026804574552702818, "rougeL_fmeasure": 0.16101456985244528, "rougeL_fmeasure_stderr": 0.0020610939231262555, "rougeL_precision": 0.12754160270794315, "rougeL_precision_stderr": 0.002011334698725272, "rougeL_recall": 0.25334667587072296, "rougeL_recall_stderr": 0.003450143632066797, "rougeLsum_fmeasure": 0.16981783764753203, "rougeLsum_fmeasure_stderr": 0.002226137523389508, "rougeLsum_precision": 0.13385208533719228, "rougeLsum_precision_stderr": 0.002070645698817516, "rougeLsum_recall": 0.26848842566929143, "rougeLsum_recall_stderr": 0.0038523767507661405}}, "1": {"article_DOC_summary": {"bleu": 1.1246061582895406, "bleu_stderr": 0.07747059021612675, "rouge1_fmeasure": 0.15837125050520046, "rouge1_fmeasure_stderr": 0.0023055850072850443, "rouge1_precision": 0.11227417163381835, "rouge1_precision_stderr": 0.0017039218550246112, "rouge1_recall": 0.2797248751495629, "rouge1_recall_stderr": 0.003968857163602909, "rouge2_fmeasure": 0.026630545400190872, "rouge2_fmeasure_stderr": 0.0012106703751066281, "rouge2_precision": 0.018669833521043514, "rouge2_precision_stderr": 0.0008449378560881147, "rouge2_recall": 0.04827881607393628, "rouge2_recall_stderr": 0.002284155004021152, "rougeL_fmeasure": 0.12365741491966617, "rougeL_fmeasure_stderr": 0.001744614390045227, "rougeL_precision": 0.08743651997872359, "rougeL_precision_stderr": 0.0012692664754791996, "rougeL_recall": 0.22012328317880311, "rougeL_recall_stderr": 0.003179126144947638, "rougeLsum_fmeasure": 0.12855514629984804, "rougeLsum_fmeasure_stderr": 0.0018970590100685048, "rougeLsum_precision": 0.09091214915987274, "rougeLsum_precision_stderr": 0.0013821688490987276, "rougeLsum_recall": 0.22855737113252247, "rougeLsum_recall_stderr": 0.0034018065673890674}}, "2": {"article_DOC_summary": {"bleu": 1.083987545697224, "bleu_stderr": 0.0951603405593235, "rouge1_fmeasure": 0.15883481893910234, "rouge1_fmeasure_stderr": 0.0022699060879070535, "rouge1_precision": 0.11250317157809601, "rouge1_precision_stderr": 0.0016800664803736658, "rouge1_recall": 0.28113282823526276, "rouge1_recall_stderr": 0.003945997628456255, "rouge2_fmeasure": 0.02705070058613688, "rouge2_fmeasure_stderr": 0.0012259402316261174, "rouge2_precision": 0.01896938772049727, "rouge2_precision_stderr": 0.0008643828022382121, "rouge2_recall": 0.049173235460005654, "rouge2_recall_stderr": 0.002268647709705696, "rougeL_fmeasure": 0.1248624072282009, "rougeL_fmeasure_stderr": 0.0017218083377439604, "rougeL_precision": 0.08821548713657433, "rougeL_precision_stderr": 0.001257682577357835, "rougeL_recall": 0.22267200234218015, "rougeL_recall_stderr": 0.003150822045727067, "rougeLsum_fmeasure": 0.1293633765948801, "rougeLsum_fmeasure_stderr": 0.0018724040714540883, "rougeLsum_precision": 0.09143863793787037, "rougeLsum_precision_stderr": 0.0013675216267640294, "rougeLsum_recall": 0.23035645576125668, "rougeLsum_recall_stderr": 0.003395221254818866}}, "3": {"article_DOC_summary": {"bleu": 1.0722820327593516, "bleu_stderr": 0.09885521374509743, "rouge1_fmeasure": 0.1568851125966369, "rouge1_fmeasure_stderr": 0.0023595898685490934, "rouge1_precision": 0.1135683171554586, "rouge1_precision_stderr": 0.0018252408618523069, "rouge1_recall": 0.2733846183658498, "rouge1_recall_stderr": 0.004127294944074159, "rouge2_fmeasure": 0.025996659748247403, "rouge2_fmeasure_stderr": 0.001202554493648326, "rouge2_precision": 0.018441537770525027, "rouge2_precision_stderr": 0.0008593607153443226, "rouge2_recall": 0.046956157677330496, "rouge2_recall_stderr": 0.0022480399509630807, "rougeL_fmeasure": 0.12213531817307888, "rougeL_fmeasure_stderr": 0.001820148746643857, "rougeL_precision": 0.08824288636817447, "rougeL_precision_stderr": 0.0013936029206214834, "rougeL_recall": 0.21403488032801135, "rougeL_recall_stderr": 0.0033187592114637225, "rougeLsum_fmeasure": 0.12753462874453708, "rougeLsum_fmeasure_stderr": 0.001953792409491164, "rougeLsum_precision": 0.09209123877139916, "rougeLsum_precision_stderr": 0.0014864917206167194, "rougeLsum_recall": 0.22350234682822415, "rougeLsum_recall_stderr": 0.00353686596355823}}, "4": {"article_DOC_summary": {"bleu": 0.5328790203575752, "bleu_stderr": 0.08576903026751956, "rouge1_fmeasure": 0.04186692901767099, "rouge1_fmeasure_stderr": 0.0023656062725519998, "rouge1_precision": 0.03474932144936362, "rouge1_precision_stderr": 0.002201931313691675, "rouge1_recall": 0.06689455692536692, "rouge1_recall_stderr": 0.0038788599391435565, "rouge2_fmeasure": 0.007066756182933345, "rouge2_fmeasure_stderr": 0.000727809037435576, "rouge2_precision": 0.005643400181474951, "rouge2_precision_stderr": 0.0007048683985523554, "rouge2_recall": 0.012053130076333454, "rouge2_recall_stderr": 0.001283667991361848, "rougeL_fmeasure": 0.033123659489118114, "rougeL_fmeasure_stderr": 0.0018362158780032708, "rougeL_precision": 0.02758638485788023, "rougeL_precision_stderr": 0.0016907629167725257, "rougeL_recall": 0.0531079976861651, "rougeL_recall_stderr": 0.003067848877689164, "rougeLsum_fmeasure": 0.03498061599676034, "rougeLsum_fmeasure_stderr": 0.0019684597857678363, "rougeLsum_precision": 0.029084229332332977, "rougeLsum_precision_stderr": 0.00179355123233279, "rougeLsum_recall": 0.05597642727155089, "rougeLsum_recall_stderr": 0.0032615168998855935}}, "5": {"article_DOC_summary": {"bleu": 2.2373133015544847e-38, "bleu_stderr": 2.788714232530993e-33, "rouge1_fmeasure": 0.002150076877118036, "rouge1_fmeasure_stderr": 0.0005715576930386714, "rouge1_precision": 0.002328789088383691, "rouge1_precision_stderr": 0.0006187865720825858, "rouge1_recall": 0.00208064502929238, "rouge1_recall_stderr": 0.0005621215174690571, "rouge2_fmeasure": 8.081906797549185e-05, "rouge2_fmeasure_stderr": 5.7158807305374844e-05, "rouge2_precision": 0.00010405105438401775, "rouge2_precision_stderr": 7.357743885200423e-05, "rouge2_recall": 6.636445315690599e-05, "rouge2_recall_stderr": 4.704542030779156e-05, "rougeL_fmeasure": 0.001640744777975664, "rougeL_fmeasure_stderr": 0.00043598430281185013, "rougeL_precision": 0.0017927242516879765, "rougeL_precision_stderr": 0.00047914637491014385, "rougeL_recall": 0.0015642137359017942, "rougeL_recall_stderr": 0.00041540866296455953, "rougeLsum_fmeasure": 0.0017214827651769189, "rougeLsum_fmeasure_stderr": 0.00045046792515902423, "rougeLsum_precision": 0.0018939725840683842, "rougeLsum_precision_stderr": 0.0005004552190432495, "rougeLsum_recall": 0.001635109178020478, "rougeLsum_recall_stderr": 0.00042818036276967824}}}} \ No newline at end of file diff --git a/4b284b6bc4seed3/evaluation/generation/slim.4b284b6bc4seed3_GEM-web_nlg_en_PALM_prompt_0.json b/4b284b6bc4seed3/evaluation/generation/slim.4b284b6bc4seed3_GEM-web_nlg_en_PALM_prompt_0.json new file mode 100644 index 0000000000000000000000000000000000000000..4913f81b0136facfbf0eb503725f7a4ff4b483b7 --- /dev/null +++ b/4b284b6bc4seed3/evaluation/generation/slim.4b284b6bc4seed3_GEM-web_nlg_en_PALM_prompt_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.32969762409287173, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.03350207893898449 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.07489491650147996, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.001916354345656983 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.300291813063712, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.00461536297454604 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.10919706809885917, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0021601422959730493 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.03439062652684824, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0011545837032529334 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.14370713443920666, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.003246173363178369 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.05063701387421738, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0013546648556391975 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.07070012219921042, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0017208007855753348 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.2895484949203548, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0044970181242023404 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.10382750267360731, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0019706115754186356 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.07104242339944349, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0017912432501280336 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.2857359841499445, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004341838499174088 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.10361568313155001, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.002010621664327297 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b6bc4seed3/evaluation/generation/slim.4b284b6bc4seed3_GEM-web_nlg_en_PALM_prompt_1.json b/4b284b6bc4seed3/evaluation/generation/slim.4b284b6bc4seed3_GEM-web_nlg_en_PALM_prompt_1.json new file mode 100644 index 0000000000000000000000000000000000000000..a62b38b544cdb9fc341a6c9d8bb1098aaa009696 --- /dev/null +++ b/4b284b6bc4seed3/evaluation/generation/slim.4b284b6bc4seed3_GEM-web_nlg_en_PALM_prompt_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.4359939783272789, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.041779670416334125 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.07266279503165236, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0017099935201375816 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.3475964219389317, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.00506748933764113 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.11088292832283875, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0019702183179370605 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.03335287604120367, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.001128095255122388 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.1660344328298045, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0035028476813622595 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.05068936829455799, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0012538981392173827 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.06772928954103168, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0015712765252988345 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.3260811514542075, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004710148749523479 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.10353647374043018, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0017861554904427183 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.06867664726380934, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0016318384908350385 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.32775048198841006, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0046848102542069335 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.1047015599685259, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0018609963369853742 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b6bc4seed3/evaluation/generation/slim.4b284b6bc4seed3_GEM-web_nlg_en_PALM_prompt_2.json b/4b284b6bc4seed3/evaluation/generation/slim.4b284b6bc4seed3_GEM-web_nlg_en_PALM_prompt_2.json new file mode 100644 index 0000000000000000000000000000000000000000..823f13b663e47ff75c4a77c44b2122829e832cf5 --- /dev/null +++ b/4b284b6bc4seed3/evaluation/generation/slim.4b284b6bc4seed3_GEM-web_nlg_en_PALM_prompt_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.5047753641043208, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.03242172296180824 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.07334706790054754, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0013930615456138227 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.3737700063497622, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.005196576717483812 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.1150888371627504, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0018709716201208576 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.032868072571177076, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.000815253916940581 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.17803179222143828, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.003604190340424885 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.051840665529172124, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0011509985318477927 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.06734503744998965, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.001233876908858107 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.3449240970361082, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004694373882052961 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.10581169764988507, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0016601816301532264 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.06919868166026465, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0013042029174787707 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.3526754078681369, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004836506777085055 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.10857869554945465, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0017505188501646559 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b6bc4seed3/evaluation/generation/slim.4b284b6bc4seed3_GEM-web_nlg_en_PALM_prompt_3.json b/4b284b6bc4seed3/evaluation/generation/slim.4b284b6bc4seed3_GEM-web_nlg_en_PALM_prompt_3.json new file mode 100644 index 0000000000000000000000000000000000000000..0e3111b50985926474ba8843ba4405462a676d54 --- /dev/null +++ b/4b284b6bc4seed3/evaluation/generation/slim.4b284b6bc4seed3_GEM-web_nlg_en_PALM_prompt_3.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.6249385322673848, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.023211819786736334 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.07372614912850947, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.001359300603084539 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.3888611122018525, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0053578637277047906 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.11637468420417033, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0018331195406713198 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.033416989091581, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0008041939460804035 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.1903256864921483, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0038053895221829945 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.05316112071013902, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0011465281622819825 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.06697897307455199, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0011891190081388082 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.3547382398864492, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004815238098721177 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.10582598758235875, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0016101686735076229 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.0694765908871884, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0012821064008090915 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.364488357943653, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0048866912766196875 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.10953693694712942, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0017209757445741357 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 3, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b6bc4seed3/evaluation/generation/slim.4b284b6bc4seed3_GEM-web_nlg_en_PALM_prompt_4.json b/4b284b6bc4seed3/evaluation/generation/slim.4b284b6bc4seed3_GEM-web_nlg_en_PALM_prompt_4.json new file mode 100644 index 0000000000000000000000000000000000000000..c662e2448781f11789766f7e313fcbeb8aea8fde --- /dev/null +++ b/4b284b6bc4seed3/evaluation/generation/slim.4b284b6bc4seed3_GEM-web_nlg_en_PALM_prompt_4.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.6172877259530323, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.0352446996928639 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.0748843501395415, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.001381267162660691 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.39598227128772256, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.00522226055907367 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.1180321735790567, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0018211841415573945 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.033363716686448004, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0008232905700585103 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.18904409931911847, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0036763179024498203 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.05290384691957595, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0011327428150165345 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.06681400109757821, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0012097158147883198 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.3551645214739529, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004603707682826054 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.1053542922815303, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0015788673153327966 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.07014407223382836, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0013067256802706008 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.3699177055550494, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0047899231539846945 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.11042261394743104, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.001708240502656495 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 4, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b6bc4seed3/evaluation/generation/slim.4b284b6bc4seed3_GEM-web_nlg_en_PALM_prompt_5.json b/4b284b6bc4seed3/evaluation/generation/slim.4b284b6bc4seed3_GEM-web_nlg_en_PALM_prompt_5.json new file mode 100644 index 0000000000000000000000000000000000000000..94afc4d06944c5e577d87c444103849e472e5843 --- /dev/null +++ b/4b284b6bc4seed3/evaluation/generation/slim.4b284b6bc4seed3_GEM-web_nlg_en_PALM_prompt_5.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.6739230942233659, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.03781903865026685 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.07434118591062619, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0013606852466120714 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.40517103911737706, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.005207962506245739 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.11775202851872192, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0017322424295727937 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.03309571045270455, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.000762355738688032 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.1960621498928731, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0037598520682319884 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.053092972525274194, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0010965950400499984 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.06663527060233249, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.001226540610105808 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.3640849747385268, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004640046414372116 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.10543601362203549, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0015178302726180323 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.06962894335162277, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.001291561351449583 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.3794277979681509, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004818380083375467 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.11016000573694927, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0016169723040308337 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 5, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b6bc4seed3/evaluation/generation/slim.4b284b6bc4seed3_GEM-wiki_lingua_en_tldr_en_0.json b/4b284b6bc4seed3/evaluation/generation/slim.4b284b6bc4seed3_GEM-wiki_lingua_en_tldr_en_0.json new file mode 100644 index 0000000000000000000000000000000000000000..0048888de626e05e979850449f7fe49cc000eeac --- /dev/null +++ b/4b284b6bc4seed3/evaluation/generation/slim.4b284b6bc4seed3_GEM-wiki_lingua_en_tldr_en_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.15541888954389302, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0018896399566670286 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.2609485104955259, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.002636869555478932 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.18074785424679843, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0018330825958722083 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.031340296740352346, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0007364805410626298 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.05475940923731912, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0013900561092136223 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.0367425698800636, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0008312312379815959 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.11824683156742628, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0012988846637495886 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.20619299633996296, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.00212551360652741 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.13925315500169771, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0012900858881895007 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.14243870027384645, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0017153432680596468 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.24072866043059984, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0024483585527040877 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.1659756245930406, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0016665877399642023 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 1.5656365853870153, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.06994438419251063 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b6bc4seed3/evaluation/generation/slim.4b284b6bc4seed3_GEM-wiki_lingua_en_tldr_en_1.json b/4b284b6bc4seed3/evaluation/generation/slim.4b284b6bc4seed3_GEM-wiki_lingua_en_tldr_en_1.json new file mode 100644 index 0000000000000000000000000000000000000000..09d984d2ade207cd36dcf7d77948f0927dc37323 --- /dev/null +++ b/4b284b6bc4seed3/evaluation/generation/slim.4b284b6bc4seed3_GEM-wiki_lingua_en_tldr_en_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.16880681390038538, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0019611277767498836 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.28525722098489775, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.002677390028605212 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.19671251716356983, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.001845617511049733 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.03604438137203516, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.000869171473451728 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.06302505515896178, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.001516286602693054 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.041911863785581135, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0008870741133490255 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.11944422928337016, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.001289252852685886 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.20967875473639086, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.002077526143241249 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.14075220661179533, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.001215604718401757 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.15784656842847097, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0018258770460077972 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.26803761801382864, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.002534338768264281 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.18414503390476486, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0017143415167847412 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 1.973383093888403, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.062022250654948985 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b6bc4seed3/evaluation/generation/slim.4b284b6bc4seed3_GEM-wiki_lingua_en_tldr_en_2.json b/4b284b6bc4seed3/evaluation/generation/slim.4b284b6bc4seed3_GEM-wiki_lingua_en_tldr_en_2.json new file mode 100644 index 0000000000000000000000000000000000000000..7acbce1f1d1246703da9c6e80d494290a49cfd16 --- /dev/null +++ b/4b284b6bc4seed3/evaluation/generation/slim.4b284b6bc4seed3_GEM-wiki_lingua_en_tldr_en_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.1736169708012349, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.001996587278110062 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.2912556116042534, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.002623711899034249 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.20072566114135942, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0017824984220287418 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.0384761806811168, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0009080570700775258 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.06572148998847567, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0015105024802730654 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.04387417540357548, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0008841272873745032 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.12265905134544655, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.001362079458617771 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.21240429042053888, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0020452824149258956 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.14291058225462885, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0011859440485204546 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.16352244262880908, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0018872605104035078 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.2749190558193557, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.002492631782723321 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.18905151622482155, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0016692502782787643 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 2.1175282747257644, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.06998742940696125 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b6bc4seed3/evaluation/generation/slim.4b284b6bc4seed3_GEM-wiki_lingua_en_tldr_en_3.json b/4b284b6bc4seed3/evaluation/generation/slim.4b284b6bc4seed3_GEM-wiki_lingua_en_tldr_en_3.json new file mode 100644 index 0000000000000000000000000000000000000000..fa43f14a60c1cb18ec0cee6c83657b3c2bc19b47 --- /dev/null +++ b/4b284b6bc4seed3/evaluation/generation/slim.4b284b6bc4seed3_GEM-wiki_lingua_en_tldr_en_3.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.14882059286798324, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0022373461300931904 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.24050957204964596, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0030817740969047145 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.16643706321643362, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0020704146578302326 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.03181983589104918, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0008484419112906057 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.05484288322789256, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0014960971078962267 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.0361752103611802, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.000867704104426404 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.10654366188722789, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0015926951137942584 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.17705682236326656, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.002371382040095437 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.11962154613019327, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0014270812276544398 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.14031012069279475, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0021128033295454685 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.2280011194950691, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.002945699576253965 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.15701568648694605, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.001941607990077885 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 2.1104572563587314, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.08130929312280372 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 3, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b6bc4seed3/evaluation/generation/slim.4b284b6bc4seed3_GEM-wiki_lingua_en_tldr_en_4.json b/4b284b6bc4seed3/evaluation/generation/slim.4b284b6bc4seed3_GEM-wiki_lingua_en_tldr_en_4.json new file mode 100644 index 0000000000000000000000000000000000000000..77802fa00a049082ef50f4c7146dfabcc362532e --- /dev/null +++ b/4b284b6bc4seed3/evaluation/generation/slim.4b284b6bc4seed3_GEM-wiki_lingua_en_tldr_en_4.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.04882282454207474, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0018421430903010254 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.07876047438791374, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.002697214616618726 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.05291772897577509, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0017907780517303251 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.01077293516300109, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0005917384833393335 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.018348282948383934, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0010183488719467035 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.011760404029928792, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0005829032307815198 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.036110109432090025, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.001374477701533682 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.05971330398388186, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0020872379456574647 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.03910342186337772, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0012989884715958904 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.045926119483004395, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0017391323394054688 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.07417627776667039, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0025389281954311367 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.049731919009013095, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0016762102641413167 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 0.4691224289773883, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.02668327939721337 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 4, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b6bc4seed3/evaluation/generation/slim.4b284b6bc4seed3_GEM-wiki_lingua_en_tldr_en_5.json b/4b284b6bc4seed3/evaluation/generation/slim.4b284b6bc4seed3_GEM-wiki_lingua_en_tldr_en_5.json new file mode 100644 index 0000000000000000000000000000000000000000..52a74ceef379aeb5809094899f16fcdae1f72fba --- /dev/null +++ b/4b284b6bc4seed3/evaluation/generation/slim.4b284b6bc4seed3_GEM-wiki_lingua_en_tldr_en_5.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.00810456902224064, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0008295622235488356 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.012892068442699021, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0012439840243997097 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.008433400400641064, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0007845519354746148 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.001717931713356291, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.00023161121403494434 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.0028267780226751624, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.00038800429271119996 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.001800717466655775, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.00022472022265705173 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.0060439886510759554, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.000615759737534485 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.009783049887326086, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0009727833840458493 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.006285400183131738, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0005802251499635472 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.0076696483874971145, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0007904189857688219 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.01212609963804329, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0011678377048075187 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.007924335842795362, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0007327104926757877 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 9.290848886467249e-07, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 1.7114521557633313e-06 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 5, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b6bc4seed3/evaluation/generation/slim.4b284b6bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_0.json b/4b284b6bc4seed3/evaluation/generation/slim.4b284b6bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_0.json new file mode 100644 index 0000000000000000000000000000000000000000..9e57d1b2e174d725a4674d2b89aa7eba597e4920 --- /dev/null +++ b/4b284b6bc4seed3/evaluation/generation/slim.4b284b6bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 1.2766060742328618, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.033382297496973044 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.12547708059065077, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.0016991149775388303 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.23286096473540036, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.002096871122935081 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.15467556742530433, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.0014870962026354128 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.020679772826704766, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0006689218506654367 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.03586683743869036, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.0008739755877011557 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.024539136332226045, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0006053943117133528 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.1237352883610742, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.0015822386288611187 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.23190983665582457, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.0020952712936508694 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.1535691608718009, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0014593610156894993 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.09629626695764527, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.001458815570353432 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.17660986438802767, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.001647260183147006 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.11750764811037896, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0011824353244648067 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b6bc4seed3/evaluation/generation/slim.4b284b6bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_1.json b/4b284b6bc4seed3/evaluation/generation/slim.4b284b6bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_1.json new file mode 100644 index 0000000000000000000000000000000000000000..a3d206018dbaa64bcfcbe81630aa0c1e164d5c8d --- /dev/null +++ b/4b284b6bc4seed3/evaluation/generation/slim.4b284b6bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 9.971524127225308, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.10544280951045465 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.48231110383057557, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.0032247228835386517 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.403997228531794, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.0028600003192301073 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.4113655457313639, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.0022474772878560124 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.2130032822750816, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0023661910744460224 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.17583012878246712, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.001978305147161013 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.1793035326067927, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0018252903214182239 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.3479327379612941, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.0027285680175982486 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.28935051237673826, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.0022709879114623396 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.29475151710386843, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.001863428554324611 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.39081628521576756, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.0029962237793696206 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.3259151337760425, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.002573842992772049 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.33218523237694836, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.002132622458139582 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b6bc4seed3/evaluation/generation/slim.4b284b6bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_2.json b/4b284b6bc4seed3/evaluation/generation/slim.4b284b6bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_2.json new file mode 100644 index 0000000000000000000000000000000000000000..2478b97afdb09bc09ab058861bbdb27be5b0165f --- /dev/null +++ b/4b284b6bc4seed3/evaluation/generation/slim.4b284b6bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 11.009017189958726, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.11145987575879608 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.5147310358802538, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.003396653197723534 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.41720988690209326, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.002792457559765853 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.43104311865962835, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.0021779427028603892 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.24498889329212936, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.002608508121965644 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.19327099949467277, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.001959163536842046 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.2002542357997297, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0017902090129902814 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.36812722202759224, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.0029336157567466338 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.2964234427792765, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.0022900011257602723 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.30590576351723786, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0018552213291573585 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.416924976940603, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.003204078619564438 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.33621578141510805, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.0025598541840636643 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.34760227841277236, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0021182372608920443 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b6bc4seed3/evaluation/generation/slim.4b284b6bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_3.json b/4b284b6bc4seed3/evaluation/generation/slim.4b284b6bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_3.json new file mode 100644 index 0000000000000000000000000000000000000000..a744b31e418a05ea2fd3a5bdbeaffbaaeec248d3 --- /dev/null +++ b/4b284b6bc4seed3/evaluation/generation/slim.4b284b6bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_3.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 11.37013872681925, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.1248535458793912 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.5262376572196412, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.003314216010987937 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.4203811757292955, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.0027242623347569794 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.4382518972315406, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.002120900374137443 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.2555054900714246, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0025360200082144213 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.19936173892529557, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.001968228951567367 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.2083080407376916, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0017923004828278104 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.3705189491307532, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.0028470148719156275 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.2958881905119737, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.0022971405804365535 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.30745568780724575, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0018843522431812505 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.42642680843427827, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.003136183576523699 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.34024569366071405, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.002549897845983359 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.3545216421140483, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.00212376511748824 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 3, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b6bc4seed3/evaluation/generation/slim.4b284b6bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_4.json b/4b284b6bc4seed3/evaluation/generation/slim.4b284b6bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_4.json new file mode 100644 index 0000000000000000000000000000000000000000..a082b02304164fa4553c3523be53175ca0c2b848 --- /dev/null +++ b/4b284b6bc4seed3/evaluation/generation/slim.4b284b6bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_4.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 11.765340533551441, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.1912402786333196 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.5306810580993595, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.0033851394123312253 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.42528611686964685, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.0026503481090942404 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.44393544366679405, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.0021690010152583634 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.260418105723064, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0025790052457071106 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.20445058835077626, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.0019669109848647025 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.21381876391107585, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0018342178017127435 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.37225379044451273, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.0028559068973251483 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.2989580220460878, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.0022621251801345312 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.31075327922766594, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0019052938372683594 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.4312812867418651, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.003185050048493793 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.3457653768297206, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.002509286441413888 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.36042783225590935, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.002153038065829124 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 4, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b6bc4seed3/evaluation/generation/slim.4b284b6bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_5.json b/4b284b6bc4seed3/evaluation/generation/slim.4b284b6bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_5.json new file mode 100644 index 0000000000000000000000000000000000000000..81e2c5efeab93b433d224e31e59881517bdebac6 --- /dev/null +++ b/4b284b6bc4seed3/evaluation/generation/slim.4b284b6bc4seed3_e2e_nlg_cleaned_generate_text_restaurant_5.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 11.642699930069227, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.1665369304874196 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.5325771024895927, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.003324417097878668 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.423375363663033, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.002579776398819506 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.44527849888326165, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.00212920846401032 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.26000882478166104, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0025160583279758833 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.2023827705716057, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.0019083505179989817 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.21356366108349217, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0018086595084145472 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.37345338410021045, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.0027850387825540343 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.29841219926012585, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.0022412056697221224 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.31225656411530295, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0018997774824826212 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.4347592206047231, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.003147641490452167 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.34531753802150883, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.002441753077630109 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.36317108046262075, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0021475431353111018 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 5, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b6bc4seed3/evaluation/generation/slim.4b284b6bc4seed3_gem_xsum_article_DOC_summary_0.json b/4b284b6bc4seed3/evaluation/generation/slim.4b284b6bc4seed3_gem_xsum_article_DOC_summary_0.json new file mode 100644 index 0000000000000000000000000000000000000000..f026adfe2a64b0c114f8eff6445400c35c18f613 --- /dev/null +++ b/4b284b6bc4seed3/evaluation/generation/slim.4b284b6bc4seed3_gem_xsum_article_DOC_summary_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.1710772835102388, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.002582017048828936 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.3373740585909959, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.004318919243908899 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.2156420598991778, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.00263185112572885 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.03815200927229576, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0014072364633565078 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.0786744064818293, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.0026804574552702818 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.04884054932435322, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0016585250835702103 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.12754160270794315, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.002011334698725272 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.25334667587072296, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.003450143632066797 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.16101456985244528, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0020610939231262555 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.13385208533719228, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.002070645698817516 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.26848842566929143, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.0038523767507661405 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.16981783764753203, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.002226137523389508 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 2.0741395710975095, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.08597567591183493 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b6bc4seed3/evaluation/generation/slim.4b284b6bc4seed3_gem_xsum_article_DOC_summary_1.json b/4b284b6bc4seed3/evaluation/generation/slim.4b284b6bc4seed3_gem_xsum_article_DOC_summary_1.json new file mode 100644 index 0000000000000000000000000000000000000000..c8dac7779315fcdf5887cec1bf2de1cbc1b8604b --- /dev/null +++ b/4b284b6bc4seed3/evaluation/generation/slim.4b284b6bc4seed3_gem_xsum_article_DOC_summary_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.11227417163381835, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.0017039218550246112 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.2797248751495629, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.003968857163602909 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.15837125050520046, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.0023055850072850443 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.018669833521043514, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0008449378560881147 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.04827881607393628, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.002284155004021152 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.026630545400190872, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0012106703751066281 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.08743651997872359, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0012692664754791996 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.22012328317880311, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.003179126144947638 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.12365741491966617, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.001744614390045227 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.09091214915987274, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0013821688490987276 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.22855737113252247, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.0034018065673890674 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.12855514629984804, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0018970590100685048 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 1.1246061582895406, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.07747059021612675 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b6bc4seed3/evaluation/generation/slim.4b284b6bc4seed3_gem_xsum_article_DOC_summary_2.json b/4b284b6bc4seed3/evaluation/generation/slim.4b284b6bc4seed3_gem_xsum_article_DOC_summary_2.json new file mode 100644 index 0000000000000000000000000000000000000000..051cce5bb9a8e03f9bf4fe1d723a1ab4c46f821a --- /dev/null +++ b/4b284b6bc4seed3/evaluation/generation/slim.4b284b6bc4seed3_gem_xsum_article_DOC_summary_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.11250317157809601, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.0016800664803736658 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.28113282823526276, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.003945997628456255 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.15883481893910234, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.0022699060879070535 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.01896938772049727, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0008643828022382121 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.049173235460005654, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.002268647709705696 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.02705070058613688, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0012259402316261174 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.08821548713657433, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.001257682577357835 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.22267200234218015, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.003150822045727067 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.1248624072282009, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0017218083377439604 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.09143863793787037, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0013675216267640294 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.23035645576125668, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.003395221254818866 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.1293633765948801, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0018724040714540883 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 1.083987545697224, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.0951603405593235 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b6bc4seed3/evaluation/generation/slim.4b284b6bc4seed3_gem_xsum_article_DOC_summary_3.json b/4b284b6bc4seed3/evaluation/generation/slim.4b284b6bc4seed3_gem_xsum_article_DOC_summary_3.json new file mode 100644 index 0000000000000000000000000000000000000000..ae0fb28faf30223cfee4df061ec988f818461af7 --- /dev/null +++ b/4b284b6bc4seed3/evaluation/generation/slim.4b284b6bc4seed3_gem_xsum_article_DOC_summary_3.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.1135683171554586, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.0018252408618523069 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.2733846183658498, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.004127294944074159 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.1568851125966369, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.0023595898685490934 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.018441537770525027, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0008593607153443226 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.046956157677330496, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.0022480399509630807 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.025996659748247403, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.001202554493648326 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.08824288636817447, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0013936029206214834 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.21403488032801135, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.0033187592114637225 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.12213531817307888, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.001820148746643857 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.09209123877139916, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0014864917206167194 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.22350234682822415, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.00353686596355823 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.12753462874453708, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.001953792409491164 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 1.0722820327593516, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.09885521374509743 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 3, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b6bc4seed3/evaluation/generation/slim.4b284b6bc4seed3_gem_xsum_article_DOC_summary_4.json b/4b284b6bc4seed3/evaluation/generation/slim.4b284b6bc4seed3_gem_xsum_article_DOC_summary_4.json new file mode 100644 index 0000000000000000000000000000000000000000..8de72a88708ad1891cb194fc06a89d514ffb32f6 --- /dev/null +++ b/4b284b6bc4seed3/evaluation/generation/slim.4b284b6bc4seed3_gem_xsum_article_DOC_summary_4.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.03474932144936362, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.002201931313691675 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.06689455692536692, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.0038788599391435565 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.04186692901767099, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.0023656062725519998 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.005643400181474951, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0007048683985523554 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.012053130076333454, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.001283667991361848 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.007066756182933345, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.000727809037435576 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.02758638485788023, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0016907629167725257 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.0531079976861651, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.003067848877689164 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.033123659489118114, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0018362158780032708 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.029084229332332977, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.00179355123233279 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.05597642727155089, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.0032615168998855935 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.03498061599676034, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0019684597857678363 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 0.5328790203575752, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.08576903026751956 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 4, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b6bc4seed3/evaluation/generation/slim.4b284b6bc4seed3_gem_xsum_article_DOC_summary_5.json b/4b284b6bc4seed3/evaluation/generation/slim.4b284b6bc4seed3_gem_xsum_article_DOC_summary_5.json new file mode 100644 index 0000000000000000000000000000000000000000..53db39f3cb107e8e0825cf607de79273d9ac6ab1 --- /dev/null +++ b/4b284b6bc4seed3/evaluation/generation/slim.4b284b6bc4seed3_gem_xsum_article_DOC_summary_5.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.002328789088383691, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.0006187865720825858 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.00208064502929238, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.0005621215174690571 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.002150076877118036, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.0005715576930386714 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.00010405105438401775, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 7.357743885200423e-05 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 6.636445315690599e-05, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 4.704542030779156e-05 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 8.081906797549185e-05, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 5.7158807305374844e-05 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.0017927242516879765, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.00047914637491014385 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.0015642137359017942, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.00041540866296455953 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.001640744777975664, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.00043598430281185013 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.0018939725840683842, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0005004552190432495 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.001635109178020478, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.00042818036276967824 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.0017214827651769189, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.00045046792515902423 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 2.2373133015544847e-38, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 2.788714232530993e-33 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed3/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 5, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b6bc4seed3/evaluation/rankeval/4b284b6bc4seed3_0.csv b/4b284b6bc4seed3/evaluation/rankeval/4b284b6bc4seed3_0.csv new file mode 100644 index 0000000000000000000000000000000000000000..8bfc9e85f6aac8ef2010d151bd5d6d53f830adb2 --- /dev/null +++ b/4b284b6bc4seed3/evaluation/rankeval/4b284b6bc4seed3_0.csv @@ -0,0 +1,21 @@ +task,metric,value,err,version +anli_r1,acc,0.318,0.014734079309311901,0 +anli_r2,acc,0.354,0.015129868238451772,0 +anli_r3,acc,0.3525,0.013797164918918366,0 +arc_challenge,acc,0.26109215017064846,0.012835523909473848,0 +arc_challenge,acc_norm,0.2764505119453925,0.013069662474252425,0 +arc_easy,acc,0.569023569023569,0.010161552863493751,0 +arc_easy,acc_norm,0.49747474747474746,0.01025965266878347,0 +boolq,acc,0.5522935779816514,0.008697094687974059,1 +cb,acc,0.4107142857142857,0.06633634150359541,1 +cb,f1,0.3024109014675052,,1 +copa,acc,0.72,0.04512608598542126,0 +hellaswag,acc,0.45628360884286,0.004970672651595843,0 +hellaswag,acc_norm,0.5851424019119698,0.004916905095810849,0 +piqa,acc,0.73449401523395,0.010303308653024429,0 +piqa,acc_norm,0.7421109902067464,0.010206956662056243,0 +rte,acc,0.5306859205776173,0.03003973059219781,0 +sciq,acc,0.826,0.01199449323097343,0 +sciq,acc_norm,0.725,0.014127086556490526,0 +storycloze_2016,acc,0.7108498129342598,0.010484068799942074,0 +winogrande,acc,0.5595895816890292,0.013952330311915591,0 diff --git a/4b284b6bc4seed3/evaluation/rankeval/4b284b6bc4seed3_0.json b/4b284b6bc4seed3/evaluation/rankeval/4b284b6bc4seed3_0.json new file mode 100644 index 0000000000000000000000000000000000000000..da7e78ad2aa93cf88f4fd0128700e6b40ff2512d --- /dev/null +++ b/4b284b6bc4seed3/evaluation/rankeval/4b284b6bc4seed3_0.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.318, + "acc_stderr": 0.014734079309311901 + }, + "anli_r2": { + "acc": 0.354, + "acc_stderr": 0.015129868238451772 + }, + "anli_r3": { + "acc": 0.3525, + "acc_stderr": 0.013797164918918366 + }, + "cb": { + "acc": 0.4107142857142857, + "acc_stderr": 0.06633634150359541, + "f1": 0.3024109014675052 + }, + "copa": { + "acc": 0.72, + "acc_stderr": 0.04512608598542126 + }, + "hellaswag": { + "acc": 0.45628360884286, + "acc_stderr": 0.004970672651595843, + "acc_norm": 0.5851424019119698, + "acc_norm_stderr": 0.004916905095810849 + }, + "rte": { + "acc": 0.5306859205776173, + "acc_stderr": 0.03003973059219781 + }, + "winogrande": { + "acc": 0.5595895816890292, + "acc_stderr": 0.013952330311915591 + }, + "storycloze_2016": { + "acc": 0.7108498129342598, + "acc_stderr": 0.010484068799942074 + }, + "boolq": { + "acc": 0.5522935779816514, + "acc_stderr": 0.008697094687974059 + }, + "arc_easy": { + "acc": 0.569023569023569, + "acc_stderr": 0.010161552863493751, + "acc_norm": 0.49747474747474746, + "acc_norm_stderr": 0.01025965266878347 + }, + "arc_challenge": { + "acc": 0.26109215017064846, + "acc_stderr": 0.012835523909473848, + "acc_norm": 0.2764505119453925, + "acc_norm_stderr": 0.013069662474252425 + }, + "sciq": { + "acc": 0.826, + "acc_stderr": 0.01199449323097343, + "acc_norm": 0.725, + "acc_norm_stderr": 0.014127086556490526 + }, + "piqa": { + "acc": 0.73449401523395, + "acc_stderr": 0.010303308653024429, + "acc_norm": 0.7421109902067464, + "acc_norm_stderr": 0.010206956662056243 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b6bc4seed3/evaluation/rankeval/4b284b6bc4seed3_1.csv b/4b284b6bc4seed3/evaluation/rankeval/4b284b6bc4seed3_1.csv new file mode 100644 index 0000000000000000000000000000000000000000..b085786fa008231d87aa682feb3da8a83b99f72b --- /dev/null +++ b/4b284b6bc4seed3/evaluation/rankeval/4b284b6bc4seed3_1.csv @@ -0,0 +1,21 @@ +task,metric,value,err,version +anli_r1,acc,0.33,0.014876872027456732,0 +anli_r2,acc,0.333,0.014910846164229857,0 +anli_r3,acc,0.3425,0.013704669762934727,0 +arc_challenge,acc,0.26109215017064846,0.012835523909473848,0 +arc_challenge,acc_norm,0.28924914675767915,0.013250012579393441,0 +arc_easy,acc,0.5900673400673401,0.01009195352750625,0 +arc_easy,acc_norm,0.5538720538720538,0.010200057828765008,0 +boolq,acc,0.5706422018348624,0.008657333755353679,1 +cb,acc,0.48214285714285715,0.0673769750864465,1 +cb,f1,0.31768388106416273,,1 +copa,acc,0.7,0.046056618647183814,0 +hellaswag,acc,0.45439155546703847,0.004968979259738328,0 +hellaswag,acc_norm,0.5930093606851224,0.004902690765066431,0 +piqa,acc,0.7383025027203483,0.01025563077270823,0 +piqa,acc_norm,0.7415669205658324,0.010213971636773315,0 +rte,acc,0.5487364620938628,0.029953149241808946,0 +sciq,acc,0.865,0.010811655372416051,0 +sciq,acc_norm,0.837,0.01168621271274684,0 +storycloze_2016,acc,0.692143238909674,0.010674598158758177,0 +winogrande,acc,0.5666929755327546,0.013926915052757352,0 diff --git a/4b284b6bc4seed3/evaluation/rankeval/4b284b6bc4seed3_1.json b/4b284b6bc4seed3/evaluation/rankeval/4b284b6bc4seed3_1.json new file mode 100644 index 0000000000000000000000000000000000000000..efd588e355020f381c24bb6de9dfa55b6bffe962 --- /dev/null +++ b/4b284b6bc4seed3/evaluation/rankeval/4b284b6bc4seed3_1.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.33, + "acc_stderr": 0.014876872027456732 + }, + "anli_r2": { + "acc": 0.333, + "acc_stderr": 0.014910846164229857 + }, + "anli_r3": { + "acc": 0.3425, + "acc_stderr": 0.013704669762934727 + }, + "cb": { + "acc": 0.48214285714285715, + "acc_stderr": 0.0673769750864465, + "f1": 0.31768388106416273 + }, + "copa": { + "acc": 0.7, + "acc_stderr": 0.046056618647183814 + }, + "hellaswag": { + "acc": 0.45439155546703847, + "acc_stderr": 0.004968979259738328, + "acc_norm": 0.5930093606851224, + "acc_norm_stderr": 0.004902690765066431 + }, + "rte": { + "acc": 0.5487364620938628, + "acc_stderr": 0.029953149241808946 + }, + "winogrande": { + "acc": 0.5666929755327546, + "acc_stderr": 0.013926915052757352 + }, + "storycloze_2016": { + "acc": 0.692143238909674, + "acc_stderr": 0.010674598158758177 + }, + "boolq": { + "acc": 0.5706422018348624, + "acc_stderr": 0.008657333755353679 + }, + "arc_easy": { + "acc": 0.5900673400673401, + "acc_stderr": 0.01009195352750625, + "acc_norm": 0.5538720538720538, + "acc_norm_stderr": 0.010200057828765008 + }, + "arc_challenge": { + "acc": 0.26109215017064846, + "acc_stderr": 0.012835523909473848, + "acc_norm": 0.28924914675767915, + "acc_norm_stderr": 0.013250012579393441 + }, + "sciq": { + "acc": 0.865, + "acc_stderr": 0.010811655372416051, + "acc_norm": 0.837, + "acc_norm_stderr": 0.01168621271274684 + }, + "piqa": { + "acc": 0.7383025027203483, + "acc_stderr": 0.01025563077270823, + "acc_norm": 0.7415669205658324, + "acc_norm_stderr": 0.010213971636773315 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b6bc4seed3/evaluation/rankeval/4b284b6bc4seed3_2.csv b/4b284b6bc4seed3/evaluation/rankeval/4b284b6bc4seed3_2.csv new file mode 100644 index 0000000000000000000000000000000000000000..3a047efdf9a61ee4faf3f229b7abc8d0afdc2a51 --- /dev/null +++ b/4b284b6bc4seed3/evaluation/rankeval/4b284b6bc4seed3_2.csv @@ -0,0 +1,21 @@ +task,metric,value,err,version +anli_r1,acc,0.31,0.0146326386586329,0 +anli_r2,acc,0.335,0.014933117490932573,0 +anli_r3,acc,0.30916666666666665,0.013346684134591945,0 +arc_challenge,acc,0.2790102389078498,0.013106784883601333,0 +arc_challenge,acc_norm,0.2901023890784983,0.013261573677520766,0 +arc_easy,acc,0.6001683501683501,0.010051788039412923,0 +arc_easy,acc_norm,0.5698653198653199,0.010159130445178514,0 +boolq,acc,0.5896024464831804,0.008603488048617523,1 +cb,acc,0.39285714285714285,0.0658538889806635,1 +cb,f1,0.2349033816425121,,1 +copa,acc,0.72,0.04512608598542127,0 +hellaswag,acc,0.45289782911770565,0.004967591267557399,0 +hellaswag,acc_norm,0.5914160525791675,0.00490567440861401,0 +piqa,acc,0.7404787812840044,0.010227939888173922,0 +piqa,acc_norm,0.7437431991294886,0.010185787831565055,0 +rte,acc,0.47653429602888087,0.030063300411902652,0 +sciq,acc,0.887,0.01001655286669685,0 +sciq,acc_norm,0.852,0.01123486636423527,0 +storycloze_2016,acc,0.692143238909674,0.010674598158758175,0 +winogrande,acc,0.5619573796369376,0.013944181296470804,0 diff --git a/4b284b6bc4seed3/evaluation/rankeval/4b284b6bc4seed3_2.json b/4b284b6bc4seed3/evaluation/rankeval/4b284b6bc4seed3_2.json new file mode 100644 index 0000000000000000000000000000000000000000..738ad260d79db592340595c36ca1f8fa5a37b738 --- /dev/null +++ b/4b284b6bc4seed3/evaluation/rankeval/4b284b6bc4seed3_2.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.31, + "acc_stderr": 0.0146326386586329 + }, + "anli_r2": { + "acc": 0.335, + "acc_stderr": 0.014933117490932573 + }, + "anli_r3": { + "acc": 0.30916666666666665, + "acc_stderr": 0.013346684134591945 + }, + "cb": { + "acc": 0.39285714285714285, + "acc_stderr": 0.0658538889806635, + "f1": 0.2349033816425121 + }, + "copa": { + "acc": 0.72, + "acc_stderr": 0.04512608598542127 + }, + "hellaswag": { + "acc": 0.45289782911770565, + "acc_stderr": 0.004967591267557399, + "acc_norm": 0.5914160525791675, + "acc_norm_stderr": 0.00490567440861401 + }, + "rte": { + "acc": 0.47653429602888087, + "acc_stderr": 0.030063300411902652 + }, + "winogrande": { + "acc": 0.5619573796369376, + "acc_stderr": 0.013944181296470804 + }, + "storycloze_2016": { + "acc": 0.692143238909674, + "acc_stderr": 0.010674598158758175 + }, + "boolq": { + "acc": 0.5896024464831804, + "acc_stderr": 0.008603488048617523 + }, + "arc_easy": { + "acc": 0.6001683501683501, + "acc_stderr": 0.010051788039412923, + "acc_norm": 0.5698653198653199, + "acc_norm_stderr": 0.010159130445178514 + }, + "arc_challenge": { + "acc": 0.2790102389078498, + "acc_stderr": 0.013106784883601333, + "acc_norm": 0.2901023890784983, + "acc_norm_stderr": 0.013261573677520766 + }, + "sciq": { + "acc": 0.887, + "acc_stderr": 0.01001655286669685, + "acc_norm": 0.852, + "acc_norm_stderr": 0.01123486636423527 + }, + "piqa": { + "acc": 0.7404787812840044, + "acc_stderr": 0.010227939888173922, + "acc_norm": 0.7437431991294886, + "acc_norm_stderr": 0.010185787831565055 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b6bc4seed3/evaluation/rankeval/4b284b6bc4seed3_3.csv b/4b284b6bc4seed3/evaluation/rankeval/4b284b6bc4seed3_3.csv new file mode 100644 index 0000000000000000000000000000000000000000..fedb53c6eb8e77d5ba242b187cffdc0322bd5844 --- /dev/null +++ b/4b284b6bc4seed3/evaluation/rankeval/4b284b6bc4seed3_3.csv @@ -0,0 +1,21 @@ +task,metric,value,err,version +anli_r1,acc,0.326,0.014830507204541047,0 +anli_r2,acc,0.356,0.015149042659306628,0 +anli_r3,acc,0.335,0.013630871843821474,0 +arc_challenge,acc,0.2713310580204778,0.012993807727545797,0 +arc_challenge,acc_norm,0.2960750853242321,0.013340916085246263,0 +arc_easy,acc,0.6073232323232324,0.010020646555538689,0 +arc_easy,acc_norm,0.5862794612794613,0.01010587853023813,0 +boolq,acc,0.5954128440366973,0.008584355308932687,1 +cb,acc,0.5178571428571429,0.06737697508644648,1 +cb,f1,0.43332988160574365,,1 +copa,acc,0.71,0.045604802157206845,0 +hellaswag,acc,0.45498904600677154,0.004969521827957945,0 +hellaswag,acc_norm,0.5934076877116112,0.004901936511546108,0 +piqa,acc,0.7421109902067464,0.010206956662056257,0 +piqa,acc_norm,0.749183895538629,0.010113869547069044,0 +rte,acc,0.48375451263537905,0.030080573208738064,0 +sciq,acc,0.891,0.00985982840703719,0 +sciq,acc_norm,0.869,0.010674874844837956,0 +storycloze_2016,acc,0.6980224478888295,0.010616985436073357,0 +winogrande,acc,0.5580110497237569,0.01395758407910899,0 diff --git a/4b284b6bc4seed3/evaluation/rankeval/4b284b6bc4seed3_3.json b/4b284b6bc4seed3/evaluation/rankeval/4b284b6bc4seed3_3.json new file mode 100644 index 0000000000000000000000000000000000000000..1d8d9bac2a5b7f48b404ab03d7c038aabcba2d27 --- /dev/null +++ b/4b284b6bc4seed3/evaluation/rankeval/4b284b6bc4seed3_3.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.326, + "acc_stderr": 0.014830507204541047 + }, + "anli_r2": { + "acc": 0.356, + "acc_stderr": 0.015149042659306628 + }, + "anli_r3": { + "acc": 0.335, + "acc_stderr": 0.013630871843821474 + }, + "cb": { + "acc": 0.5178571428571429, + "acc_stderr": 0.06737697508644648, + "f1": 0.43332988160574365 + }, + "copa": { + "acc": 0.71, + "acc_stderr": 0.045604802157206845 + }, + "hellaswag": { + "acc": 0.45498904600677154, + "acc_stderr": 0.004969521827957945, + "acc_norm": 0.5934076877116112, + "acc_norm_stderr": 0.004901936511546108 + }, + "rte": { + "acc": 0.48375451263537905, + "acc_stderr": 0.030080573208738064 + }, + "winogrande": { + "acc": 0.5580110497237569, + "acc_stderr": 0.01395758407910899 + }, + "storycloze_2016": { + "acc": 0.6980224478888295, + "acc_stderr": 0.010616985436073357 + }, + "boolq": { + "acc": 0.5954128440366973, + "acc_stderr": 0.008584355308932687 + }, + "arc_easy": { + "acc": 0.6073232323232324, + "acc_stderr": 0.010020646555538689, + "acc_norm": 0.5862794612794613, + "acc_norm_stderr": 0.01010587853023813 + }, + "arc_challenge": { + "acc": 0.2713310580204778, + "acc_stderr": 0.012993807727545797, + "acc_norm": 0.2960750853242321, + "acc_norm_stderr": 0.013340916085246263 + }, + "sciq": { + "acc": 0.891, + "acc_stderr": 0.00985982840703719, + "acc_norm": 0.869, + "acc_norm_stderr": 0.010674874844837956 + }, + "piqa": { + "acc": 0.7421109902067464, + "acc_stderr": 0.010206956662056257, + "acc_norm": 0.749183895538629, + "acc_norm_stderr": 0.010113869547069044 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b6bc4seed3/evaluation/rankeval/4b284b6bc4seed3_4.csv b/4b284b6bc4seed3/evaluation/rankeval/4b284b6bc4seed3_4.csv new file mode 100644 index 0000000000000000000000000000000000000000..beee2264e7e02cf905f11708d44f88eb48d69d46 --- /dev/null +++ b/4b284b6bc4seed3/evaluation/rankeval/4b284b6bc4seed3_4.csv @@ -0,0 +1,21 @@ +task,metric,value,err,version +anli_r1,acc,0.324,0.01480686473373886,0 +anli_r2,acc,0.361,0.015195720118175124,0 +anli_r3,acc,0.3641666666666667,0.013896714966807262,0 +arc_challenge,acc,0.2764505119453925,0.013069662474252425,0 +arc_challenge,acc_norm,0.2935153583617747,0.01330725044494112,0 +arc_easy,acc,0.6001683501683501,0.010051788039412911,0 +arc_easy,acc_norm,0.5787037037037037,0.010131882498193126,0 +boolq,acc,0.5868501529051988,0.008612117547803578,1 +cb,acc,0.42857142857142855,0.06672848092813058,1 +cb,f1,0.24317460317460324,,1 +copa,acc,0.75,0.04351941398892446,0 +hellaswag,acc,0.45488946425014937,0.004969431900874299,0 +hellaswag,acc_norm,0.5929097789285003,0.004902878806733035,0 +piqa,acc,0.7377584330794341,0.010262502565172445,0 +piqa,acc_norm,0.749727965179543,0.010106561880089775,0 +rte,acc,0.44765342960288806,0.029931070362939526,0 +sciq,acc,0.892,0.009820001651345693,0 +sciq,acc_norm,0.872,0.010570133761108654,0 +storycloze_2016,acc,0.7006948156066275,0.010590117252248798,0 +winogrande,acc,0.5627466456195738,0.013941393310695917,0 diff --git a/4b284b6bc4seed3/evaluation/rankeval/4b284b6bc4seed3_4.json b/4b284b6bc4seed3/evaluation/rankeval/4b284b6bc4seed3_4.json new file mode 100644 index 0000000000000000000000000000000000000000..745fd51c2c5d826ace00947b381c2e853e464c80 --- /dev/null +++ b/4b284b6bc4seed3/evaluation/rankeval/4b284b6bc4seed3_4.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.324, + "acc_stderr": 0.01480686473373886 + }, + "anli_r2": { + "acc": 0.361, + "acc_stderr": 0.015195720118175124 + }, + "anli_r3": { + "acc": 0.3641666666666667, + "acc_stderr": 0.013896714966807262 + }, + "cb": { + "acc": 0.42857142857142855, + "acc_stderr": 0.06672848092813058, + "f1": 0.24317460317460324 + }, + "copa": { + "acc": 0.75, + "acc_stderr": 0.04351941398892446 + }, + "hellaswag": { + "acc": 0.45488946425014937, + "acc_stderr": 0.004969431900874299, + "acc_norm": 0.5929097789285003, + "acc_norm_stderr": 0.004902878806733035 + }, + "rte": { + "acc": 0.44765342960288806, + "acc_stderr": 0.029931070362939526 + }, + "winogrande": { + "acc": 0.5627466456195738, + "acc_stderr": 0.013941393310695917 + }, + "storycloze_2016": { + "acc": 0.7006948156066275, + "acc_stderr": 0.010590117252248798 + }, + "boolq": { + "acc": 0.5868501529051988, + "acc_stderr": 0.008612117547803578 + }, + "arc_easy": { + "acc": 0.6001683501683501, + "acc_stderr": 0.010051788039412911, + "acc_norm": 0.5787037037037037, + "acc_norm_stderr": 0.010131882498193126 + }, + "arc_challenge": { + "acc": 0.2764505119453925, + "acc_stderr": 0.013069662474252425, + "acc_norm": 0.2935153583617747, + "acc_norm_stderr": 0.01330725044494112 + }, + "sciq": { + "acc": 0.892, + "acc_stderr": 0.009820001651345693, + "acc_norm": 0.872, + "acc_norm_stderr": 0.010570133761108654 + }, + "piqa": { + "acc": 0.7377584330794341, + "acc_stderr": 0.010262502565172445, + "acc_norm": 0.749727965179543, + "acc_norm_stderr": 0.010106561880089775 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b6bc4seed3/evaluation/rankeval/4b284b6bc4seed3_5.csv b/4b284b6bc4seed3/evaluation/rankeval/4b284b6bc4seed3_5.csv new file mode 100644 index 0000000000000000000000000000000000000000..5006e4bfa54fee89ffbdb2503f006f9eb0988fcd --- /dev/null +++ b/4b284b6bc4seed3/evaluation/rankeval/4b284b6bc4seed3_5.csv @@ -0,0 +1,21 @@ +task,metric,value,err,version +anli_r1,acc,0.347,0.015060472031706613,0 +anli_r2,acc,0.328,0.01485384248727033,0 +anli_r3,acc,0.3475,0.013751753243291856,0 +arc_challenge,acc,0.2764505119453925,0.013069662474252427,0 +arc_challenge,acc_norm,0.28754266211604096,0.013226719056266132,0 +arc_easy,acc,0.6077441077441077,0.010018744689650043,0 +arc_easy,acc_norm,0.5833333333333334,0.01011628297778126,0 +boolq,acc,0.6064220183486239,0.00854467241848691,1 +cb,acc,0.5178571428571429,0.06737697508644647,1 +cb,f1,0.3578242744909412,,1 +copa,acc,0.75,0.04351941398892446,0 +hellaswag,acc,0.4539932284405497,0.00496861353930925,0 +hellaswag,acc_norm,0.5944035052778331,0.0049000362613090395,0 +piqa,acc,0.73449401523395,0.010303308653024429,0 +piqa,acc_norm,0.7442872687704026,0.010178690109459878,0 +rte,acc,0.48736462093862815,0.030086851767188564,0 +sciq,acc,0.899,0.009533618929340983,0 +sciq,acc_norm,0.886,0.010055103435823332,0 +storycloze_2016,acc,0.6985569214323891,0.010611646032767584,0 +winogrande,acc,0.5643251775848461,0.013935709739615713,0 diff --git a/4b284b6bc4seed3/evaluation/rankeval/4b284b6bc4seed3_5.json b/4b284b6bc4seed3/evaluation/rankeval/4b284b6bc4seed3_5.json new file mode 100644 index 0000000000000000000000000000000000000000..78e8cb826c2daa1031421338b31578fc843f2a5a --- /dev/null +++ b/4b284b6bc4seed3/evaluation/rankeval/4b284b6bc4seed3_5.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.347, + "acc_stderr": 0.015060472031706613 + }, + "anli_r2": { + "acc": 0.328, + "acc_stderr": 0.01485384248727033 + }, + "anli_r3": { + "acc": 0.3475, + "acc_stderr": 0.013751753243291856 + }, + "cb": { + "acc": 0.5178571428571429, + "acc_stderr": 0.06737697508644647, + "f1": 0.3578242744909412 + }, + "copa": { + "acc": 0.75, + "acc_stderr": 0.04351941398892446 + }, + "hellaswag": { + "acc": 0.4539932284405497, + "acc_stderr": 0.00496861353930925, + "acc_norm": 0.5944035052778331, + "acc_norm_stderr": 0.0049000362613090395 + }, + "rte": { + "acc": 0.48736462093862815, + "acc_stderr": 0.030086851767188564 + }, + "winogrande": { + "acc": 0.5643251775848461, + "acc_stderr": 0.013935709739615713 + }, + "storycloze_2016": { + "acc": 0.6985569214323891, + "acc_stderr": 0.010611646032767584 + }, + "boolq": { + "acc": 0.6064220183486239, + "acc_stderr": 0.00854467241848691 + }, + "arc_easy": { + "acc": 0.6077441077441077, + "acc_stderr": 0.010018744689650043, + "acc_norm": 0.5833333333333334, + "acc_norm_stderr": 0.01011628297778126 + }, + "arc_challenge": { + "acc": 0.2764505119453925, + "acc_stderr": 0.013069662474252427, + "acc_norm": 0.28754266211604096, + "acc_norm_stderr": 0.013226719056266132 + }, + "sciq": { + "acc": 0.899, + "acc_stderr": 0.009533618929340983, + "acc_norm": 0.886, + "acc_norm_stderr": 0.010055103435823332 + }, + "piqa": { + "acc": 0.73449401523395, + "acc_stderr": 0.010303308653024429, + "acc_norm": 0.7442872687704026, + "acc_norm_stderr": 0.010178690109459878 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..71a2ffa76ace7a4f6e54fba2bbae68e1f692d6e3 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a764e672b541570691b2250cf83191d497df35972253523b6c76dd22461f899f +size 199058647 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_0_mp_rank_01_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_0_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2866d7ee9284be66137f04d30247f5fae52300e6 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_0_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:238ec397975c2d7b90064365eeb3f5d46a71191ff334989589d2cf9554efd05c +size 199058647 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..01d26e42d9a38fef16c2d9b145ef9dbd8ab44600 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:faf7874221d9c96dfacd083227e2b82eed43afcd81abc4821ef5d8b392b67be2 +size 199058733 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_100_mp_rank_01_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_100_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8a0045997939c976a7ea8881490c533492aeaf25 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_100_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6c6050acb62d50a9147f60f573999e1aa9867bc10ed64d80653a35cc63f20cd7 +size 199058733 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..aa8ce92c38b71d767dda63540a7ac16fc779b29b --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3cf843cd2921456a083bd15dffd7da2d58a367210b00c1094af31aa90673f230 +size 199058797 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_101_mp_rank_01_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_101_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..344c214df2130049bed1f1feb043729b25dbd585 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_101_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:73cf3e5dc93983dfe115b678275988e5c7ee4b48f686c0ec85412c2cb971e41e +size 199058797 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..589fb298d4fd8e5960854a638585085f9daab08b --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6f9a5ae2c4f6bb2637c1a2324b9ddb76b3d159ed0c3edb967728766e76125d4f +size 199058733 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_102_mp_rank_01_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_102_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e9addb07baee8f5c362ef7247fe59b9d7bf0f197 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_102_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:39a115ff7a78557819c4a420b2b6145ed29e5d9cf14dc75299dafda0c7bdbad7 +size 199058733 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..af9f0213769d6a9582167ef5403690fb637971b9 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aecb82c184e05d73d2e847d69343fae8abcab8e11bddf14c96b02929f93f0c7f +size 199058733 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_103_mp_rank_01_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_103_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c4a6162858233efb413f4cd59e5fef2fad835b50 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_103_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a2f28496875c895dd749ebeea9564be810b3b6fe47670b8b94c63b156c81419b +size 199058733 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..309d68fc7c4ec17d74c0ccc475f70b1cf01d1b93 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ec378a3ae233da476abcb7739c8c6438faf8595d0f9836e7b73511d5d604aa8a +size 199058797 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_104_mp_rank_01_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_104_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a2a0f2a8b227196fbbc92b560c8ebf943d92a04b --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_104_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6c4572ae1966fbadd5c2df969641a25c011764cafed91c599e90d87ffb8df8b9 +size 199058797 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bbc4c3191c676050a66ab5189ae113434f652707 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6dcd92afd9b3eccf9a3595931cf65fcb7593c52b46602c41d743040deb79ffc1 +size 199058733 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_105_mp_rank_01_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_105_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6e17937da95b0bff385a001b66a24d0b09e903e8 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_105_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b179851d9606783dde7887e52708b396546a838668209c9713f9595e18ab0b38 +size 199058733 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0eba580d67c9bc767b7677532293d1ac5ed5d197 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:090ad0e2fb729d10f4b8ee60c701b159787b402001038de29e812c1cba124bfc +size 199058669 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_106_mp_rank_01_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_106_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..eac393a7a50a2534f35228c8ac08b28d3092c3ff --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_106_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3a40ea23e2e491ae9887b3af0b3a7923b1f585f9c6b428974786525c42096973 +size 199058669 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4d62d7c721d141cc39def9a019f469bc9ec2b5d4 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c4c5c559efac0ff9a0ab604d867dee21c598889b4ce768c90c4b5efbf82acbba +size 199058797 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_107_mp_rank_01_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_107_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..39745ee85ff651765ba93c55508ab4a7c79f8b28 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_107_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fe1e17c9bbd4750ca8d243da56dc7e7fd86361c5d334c97fed432a7e1e5048b2 +size 199058797 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2d9b03b0c3a45e59ee33298d5e0c22da239ffc09 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1ce30deaa84cf959f49308626b6a15126854ea5fe5fdba2caed81b02304d7b94 +size 199058733 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_108_mp_rank_01_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_108_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a3d81468aef729bbd8c048ce887f478ce4792f00 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_108_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3d76a2316eb8979271b5daea31e804d448c793e7662864fb5c4dcca9107d27cc +size 199058733 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..52901cd77ca81fed96b99e9d31701bc83dcd28e1 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4cef2bcdea57d90b15091d2904946d982cd51d583b92b5099ecef400ca02739a +size 199058733 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_109_mp_rank_01_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_109_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1e3dbdac1028ee077add5bb3c48285aeb0970e04 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_109_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1c93370921065828439b87bb63a05e7b08ec60582be2399af1182a4ffb9ba473 +size 199058733 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..63dd65fd6bef1de1cbf2de0d663462e6ab68ae2f --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c81eb665c84946692daa4afa4e492018e453a74487e9ea0113eb6e88419175a2 +size 199058658 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_10_mp_rank_01_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_10_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..26b2814ec287c1bef1d171c58c3fd561f2d13924 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_10_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3d15ba4ef9aa9a593eab7025fe6ebdcd8223758237ebd4f632aa5140cbe5f23a +size 199058658 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..60a5694e4a7c193632c34929dddee9eab57de6bf --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:326b85a0585d2dd874c5286d6b76604010ea220a1ea1b2e407fcbe447c993979 +size 199058733 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_110_mp_rank_01_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_110_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b8973326b83922f08ac1fd69c3d65f867f0d1523 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_110_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e505921d12e2bb3ae35410618b72cfc31f0e0da296a80ad2fc700a9e54f597e6 +size 199058733 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3192d7767c5b6f9cc96b26492f996dba6a0352d4 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b1f95d004538abc9fc48648e9b0b257f279d04d23d4b4682ec165778572a7b8 +size 199058797 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_111_mp_rank_01_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_111_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0578e5394c315117cbd55bf4561f501c896c5ecf --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_111_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9856bcc60e38b0ceb3a188d1cf04d6b1b1a0c59fc770fc74c4fd1a3405a2a987 +size 199058797 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..25ca064efc2a7ae543adee62bd4cdcf924a7b53b --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2949a05f89c531a41cdf855ec6b40ca5975da54b8c4308f860c27b5c7d258b9f +size 199058605 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_112_mp_rank_01_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_112_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b19c22be1ea62a87b12540186fd4aaed2ff1f725 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_112_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9a2d3c57e6186d660d38614fab9310061d824c069cb998318d03db3032b5f1d4 +size 199058605 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..62313a6bd8df5990a1bb9e0f6fab18484108656d --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:90411d16c096bbca90f0c78052afe510764e537266a45f8ac711c3129b11d76a +size 199058669 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_113_mp_rank_01_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_113_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fac4173471738abbb961bbdd918ea22bbbb63dfc --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_113_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d33fc79202d6fc7d9a26432a4318648f40dca8d654e2c3a07967a4a73fc8a12b +size 199058669 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4e6b3a654b6e7a616f1697db27ca82be2a24beac --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:093553b1c17085c0c4885b1ebc6465d0a617bfd3a4a52195a5a882bec0a768c2 +size 199058797 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_114_mp_rank_01_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_114_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1ab242693869e89750b1a3f659bf168fd9f62b95 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_114_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9ee1a2e65dd22ccbff83e10e5700638854370b5b436f1ff1c7ddeb9cd0a566ca +size 199058797 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..25748f5c9a8fe2d0c0ef52b06a797a789fa0fd6c --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:27971695c22367db866b5fbf8700f77116dd70384be2c89205a7f5bbec209678 +size 199058733 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_115_mp_rank_01_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_115_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3ea47b6b90c1838f3f5738dea0e51f46957ebc3e --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_115_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dae59ead894223002a2dbf7cb5aaf92f4179e69001511f7699bd0563805a720b +size 199058733 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cd6bcd6a557b050836fa083aa6169ad04034bc2e --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b9518fbd0ce2118d735b47ac1aa2345ab3b382828a0517cec2df20467c06d847 +size 199058733 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_116_mp_rank_01_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_116_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..545b345309965a44b99c14f34a78661720df4853 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_116_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5a714829c87ac6affaefed026a4a592464f56afe95fd9dea58ba942846b6b6de +size 199058733 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e2447282020db5aed7d7d06b64724ad5ceee2c0b --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d5971c9da4d92cf8d5c15fb9f9c5ce9a610800c3ec4ea12a1e23b3a99be1aac0 +size 199058733 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_117_mp_rank_01_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_117_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6423bc38ba28bada1d8ab9b7109baf6157f6a7f1 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_117_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:34e53fe79a2a12c54a1754eedd88231cf38f36b50941538be4a2a6fdcf3cd66d +size 199058733 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..97c086d49adf079a771b4070f612b727d8333650 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e0d8c92eb02e23f4f6f8f8a94b53e86e6120b71fa246fa297330754cd08566fb +size 199058797 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_118_mp_rank_01_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_118_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5930e0f3b06624426283d6883bfcb5fa6efc0b52 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_118_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e0c622324eccf275864c09c078258921dcc12b0415dea7a9f090f77eac5db594 +size 199058797 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c5fcb354568c96599368d491a690b9c4e43b631e --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:44cdef6bb043d55b5039b6909d64f6c8fce049f84b5040bd90bcc687011bf446 +size 199058669 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_119_mp_rank_01_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_119_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..86fb86878593d3d837086e1ec0595e59683f75ae --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_119_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1411b7f8fa3dbe04796258950fa224d1e4f6279ae85e7f1650b522f399adf0eb +size 199058669 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5493f512f6afec88a4cd01ee6962a4b2851dd01a --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a02054d7f445ffd02678dbe6adc43869be00cd4e52f7d4853f542a3faebd4510 +size 199058850 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_11_mp_rank_01_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_11_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8e497c6ad054e81cb94821ea80780987b7ec36c6 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_11_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:83539ac4628d70603c50911f6ea499d335ac49357e3c756da6ed63c77f3eef9d +size 199058850 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b73a9608e6f35cc7209a57528e841cf73e815460 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e27f3f09bc704ac4765ab4facadd298c938418fa88aca5d125832268164d373c +size 199058669 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_120_mp_rank_01_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_120_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c037df86dc5c13f762eb4f2eb062b2d0f500b594 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_120_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f7868af66f1bb9255e58bf7545bae1a68f8ec40ef3fa88a2fe9e58eb2690881d +size 199058669 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b5fb8964c0ce774769f1fd89c0f57abfde8dd0be --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:38e4637932a1b733fb1995a612fedcb80171238137731940dea3114802febc75 +size 199058797 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_121_mp_rank_01_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_121_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d858726f1f2efa81e5154d0a6702448bf1fab094 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_121_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9de0d8477cc48449cd77c477749bab66fdbc2ff0e3a65bdbc2072721cb0d2f18 +size 199058797 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..31b97235024a59c64b0b54a48a2ca48eb9d4c05c --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ac712082a8d35822cb23b9826f2437584da5a0389a3e1f5c69bf4a6dbe574cf7 +size 199058733 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_122_mp_rank_01_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_122_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7184d337413350221415e9a6edd3d8692cc51ecf --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_122_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:520eb081be4de673cc3599afa705694fb97d2d914f856283754078d33eaf515a +size 199058733 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d22eaa14a5ef6c01968924639549213fa96ef675 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1953d265dc781614660d8552e0a7a0b2fd8dfd183762cf0734b2740a44b6978a +size 199058733 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_123_mp_rank_01_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_123_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a9606e3ce16ecbd30c46b353e9ff357211d78fba --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_123_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1642d3eb0729028f6b6752636a385c8356cf8fdd8a53f233dbb14e9bb777920f +size 199058733 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..931c6b53b9d09a1e8478a2df395106fe5bdaecf7 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c54b9428a0461743457e3dbeefd5a91708d0586b410df27ea09caa8549977307 +size 199058669 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_124_mp_rank_01_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_124_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d8a525a959e5bb0aa37bc47fc7dd80c65b447dd0 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_124_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:756d41178432abcc027111686ea3b762cfc334d43789187633f748b377e4a1df +size 199058669 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a17c01c37714ae570a80ee261c11e69a69559786 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e7026f75572af0bdd330736949d9e0484e480297977074c478e88c22c575e228 +size 199058925 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_125_mp_rank_01_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_125_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..36ee55b51c18321744ec7580f59f6b7f702a1420 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_125_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:512cddb6d70700773f39ba68e11e2e4af29f6c96b09077f75e9b82b03dbc3ae7 +size 199058925 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..98b1c609ffda638f25ee5aa8985d6348e9cc91d5 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:85469b4f600ea4ada777e8ad1c233e9a34b7909d0e5f9a85df969506f709a091 +size 199058605 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_126_mp_rank_01_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_126_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..99b40254ce311d7818e128095a272b4352c503eb --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_126_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:913cc6815207cf72c74171aea600c708594bf64467cd3b056eb26fb1513b9868 +size 199058605 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ac9ffb3be800e573e28ba683c12d3d72f906c701 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3bd09894e6f3d4e3ebaa949d8a95eb2fc1a6968effa43deef24f926eb23fdb70 +size 199058605 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_127_mp_rank_01_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_127_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..eb37c5ce8d95c751875cc541b5a4b97cf1325c6b --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_127_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a54120d1ef8bd8db5b58961e11361472d72c1df2a4ead71cea9d695f7249486c +size 199058605 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..23bae23173cfb04fe40fc8b3a5a9d2874194c294 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:054e85c49266c8258ab325382fa9ea730f5870361c428e5db6200a3cb877a4ac +size 199058722 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_12_mp_rank_01_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_12_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a5ecbb40e2d5ab8be713882d31a32f4efbf18c75 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_12_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:96882f5212439fa90e9493f8526b7926a3d924be62cb0fd9ae259f52cb2d48e8 +size 199058722 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ef3083a06a3902fb2dc25e41a14bf261e9c361e2 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:232427e711cc39587eafe32ef2b65f95b2b7e0b207c983763f1389a1733b2a46 +size 199058658 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_13_mp_rank_01_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_13_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3c1f1f91cef190bd4d8e7f8b88f7e68002d6de05 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_13_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ae551806a17a909867124b68eaa4bf32e5058642dcf25fc718188315dbf65946 +size 199058658 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2e9a6e105dfbf7b4f17fe28435e9f86443bddbe0 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1499ec7b386494716d0c884899b7874ee6af99b06182eaeeb6687bdc2a428596 +size 199058722 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_14_mp_rank_01_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_14_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b09650d47f26d1c7ebdd228540529fcf5b7d598c --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_14_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:94812e6ecd8e5ac7501797a8484a4f5ba5378446e026324fb3692bffe32f29e2 +size 199058722 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5d9fbdb0991186f85d022de0eb3a45ffe16f5912 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:62b86d189baf80dc4e4a8048e9f8f2b4e3d3651ba9fed1a5eb1fbfd29cf05cd3 +size 199058658 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_15_mp_rank_01_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_15_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..690c9b6ce3d114f417873362a40617bd1e1617de --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_15_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8cbc382075e7b7dc56812de307e70d797d667b8e37c134158de4503ecc9506a5 +size 199058658 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b0618e3e310101d1ad6054fa8bae2fbefbbb2a62 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:486db19fc3d2d1dbea4c382ea131992dd6efdc1608af43050795d55c9ac88439 +size 199058786 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_16_mp_rank_01_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_16_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b694903a917df7da463341319730b99e9656f8d6 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_16_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d743f435be41f4c6da79b1dea1d8f3ee5c8349803565e1f70927248bfadc46bf +size 199058786 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8bac2dbdaeaa774abe4e670d4de7fa99ead915c0 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ccb834a6fcdb3fd40b1544c5302fb2aad2466d545dbc5a715c2eea90704dc28 +size 199058658 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_17_mp_rank_01_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_17_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9456b5239853c3de94e8615ce614474497abaa23 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_17_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:939137b20af71b68c6aec02deb6d7828ee0a1e55632b44c775f1955fc331d684 +size 199058658 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8253e0c1709b1261858c5062bc6db887000d9fab --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:78f3745285008c5ccf969735bd80a545bb1534395318ab1530fdf322ea7b5467 +size 199058978 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_18_mp_rank_01_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_18_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2a1e8aa536e16efdfd3418ed8644798a11614513 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_18_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:31bac67e4a70eba86cdddb58b1de17417c167e4568f24ec2acccac630ee77f80 +size 199058978 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2766d170e64b013faa9acee7016dc2dd0fd9d647 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:44f304d05f35e9f396405daea3be7c328a966395d362b3baaad1eb2ef0a41cda +size 199058658 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_19_mp_rank_01_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_19_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..90b8ccda11624737f36a3522756acf36c3da707c --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_19_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f7825a415d8c36b30c2c37245f9409a6d2b36750fb050d433487dacf3831954c +size 199058658 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8bb1409d9effa770d5a40ed2da847b9bcd9fa474 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5a546875b0374bb39482e3709457a1c037cb1f9c160a3766988901c714742bce +size 199058647 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_1_mp_rank_01_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_1_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5476b0993b5d3d04812999dc1ee27c765679cf62 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_1_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ed9cab6ffeeb81166c7013439af5ad706f943e6e9a5fc797d70eed9c4fdd7ab3 +size 199058647 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3ed2110d93155dead3e3f01b5cb88b190808885e --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3690ae4dad09d23bc5cec78bbc2879292c2f6aaff526f6835b19e3c592c23854 +size 199058658 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_20_mp_rank_01_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_20_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..724af2bbaf8036247d9aca866918dde376c84063 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_20_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dccb6d7e5039c71efe5f61486962a51f1eddc4858f939e9e08d7226139634078 +size 199058658 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b8650e29883eba2ed961e82ee2e35fcabdbf4947 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3eb48a625c21e252255d4d068350f68a1403cd4ef0c5cb83697e4c5179ac6a9f +size 199058722 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_21_mp_rank_01_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_21_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7d17e75e15b7d11656bdc83ef0af9cffa6fbaf08 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_21_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3f3e6d09ca490196ab1a9dc2e93c368d992e42c7d2a8bb39f8c64f66c4dc1cf6 +size 199058722 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2c6ad9640b0a33dad91f215a71e3f18dc7c33bd4 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6e51ee77a002919ec4e26d82dcc329e1e27a647d8b72ef9ab2d0535273091502 +size 199058658 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_22_mp_rank_01_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_22_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..77f4bc59c3a8db872ac8d757df7de7328e65b8e1 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_22_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cdae2267e6c68ef576872130b680942583f63f86d5579379201ee4fe116c5203 +size 199058658 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f99961c7e5f9279edfd74d8b51f66a13dfeaa5b3 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:54e63d8688d7f07670bef2f6043a0048b632048833f3fdee90f63852cb3d07b3 +size 199058786 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_23_mp_rank_01_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_23_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..47524216d5241dbba3511772e9b2d1787d3ecbdc --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_23_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e22d75be6df0111871738c4ba3cf698433ce221bfca5fe15ea14515046bc52e1 +size 199058786 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4b95ebb945d76c85df445e2706a92e1597c3db14 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a93d7f434542e267b2ec05e3914ec846976b83d3813857bafe112509d5703f14 +size 199058722 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_24_mp_rank_01_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_24_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2ef0866b1c450ad4a225e887dbd8fbe75e897490 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_24_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:64a380a32cce2575d328ba0e227caf39fac45f56879a33652c5dd569dadb50a9 +size 199058722 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dadacc4368ccacec7733d758b855b19c4d143f70 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c2ae78fd35ee62407b46fc2223f27efa1979f28c3b1802130fe25f22ad71180d +size 199058850 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_25_mp_rank_01_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_25_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9ae1dee5e73ae45d04e24f259cb59e08d95eabf9 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_25_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e2db0ba03897c459cbf632a50011b31c94c85f60390e4eeb66be9ab3b4e3dfb8 +size 199058850 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..62ae4aae7d516653f096f9bd61f9a19c623aef82 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5845c5d2c9a717566129874ae505fafbb248aaeb60cde9a6cd9def338ad50d01 +size 199058722 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_26_mp_rank_01_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_26_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..705e2160dcd3073a7f6b2fee15f2fef2df0386d6 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_26_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d4e52741c589dd3509ccf15b5ae183f9b2c0548ff8231ae366e99693dea59391 +size 199058722 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7ad682332a60bb07b0a27743e89a932e7c98ea1d --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c2304dfe3921022dd4768217dc5b169e8ed3a726ece46828af22f6a0a99fe32d +size 199058722 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_27_mp_rank_01_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_27_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ffcd47ed6f2389decba5c7f9a19a16a57a0a5b39 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_27_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3334614456514f05c6fde955f9ea67f4848f3020ea53f058bfecfabb97e0f891 +size 199058722 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cef2ca6d6c3b4c8db76d169c2b40bbe22cf41712 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:88f71a2699d2fc4eca39689fd042deb309fb05d2c6e4911f5b3d43dca16c4235 +size 199058594 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_28_mp_rank_01_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_28_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..234e868ab4c8708db87a912b3e89d6de38ae7655 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_28_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:be84782ab24ab392a1b5f70d8d63ea5a74999441c944db84182b720f7c528804 +size 199058594 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f889ef3a44886b3862aae0b0b41119540f05c2e1 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bc6edd2e5f35c77474159af15c54dbaed603ebaf02ba42c44543feb282c1bdd6 +size 199058786 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_29_mp_rank_01_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_29_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..97239e8e45f8c1f2006fa7692ba0e5a118ba04e4 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_29_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:02d2a44e7dc42afd5dfc17d2fb7404c6073351ae6cc506988b850f2de4537482 +size 199058786 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..52bdb23af8c26c5536b997d0e57c14795286314f --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b7ee9531a75944fd1f5184ec4a13ef9d7baeab8ec2490dae986558aec864a940 +size 199058711 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_2_mp_rank_01_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_2_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..310c25f48fefb0830c53f8d45a6271354d12c53b --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_2_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b9a212175f47430011d3638fef4b3b2a9ead553aa1b04f0b4be5aee4553f4af1 +size 199058711 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dc3e17827673dd50c6d8115db260eea2405b194a --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c2bc83abf0166654926a16289ce43a59f9c79643786555ca9780be3e28f074fd +size 199058722 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_30_mp_rank_01_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_30_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7d3e3b65cf5d0073addded50e797f1c24925fac6 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_30_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:de939ae86b47e2723e33cf455215ca1afa8e251ea35e3c02a1929ae11f59847d +size 199058722 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1f62749b8188430736c2c72843555e1323505731 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d9761009e0192a3212dc4efd734bcbf20665731a6ff94d1f62a309a6552e49ca +size 199058722 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_31_mp_rank_01_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_31_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ccb4c98901462b3f1f00c58ff256043fd2cfe692 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_31_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:69735a4eef89cac3538f5272750db77d15aac6552fd8a9220baafed1cf1f9351 +size 199058722 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e39405b071d35520ca9a641e293ea3287d3182f1 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b130b8075f734245ba453680bd69f37b95686354b98c228869103031bdf9ae3 +size 199058722 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_32_mp_rank_01_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_32_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dadbc97b3652ec9779218bdf0153e1553a0b11ec --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_32_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:88014adb80708d35923c4ca8e203b7d6911326ad64fff96f2ef9e8e92004c109 +size 199058722 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2721cc948153a17a866d89bc17d671185f2160b9 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:defe44684212134b0cb6eeb856a20b7dbbe802092bf5aef6cdd90c90d7ca2d16 +size 199058722 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_33_mp_rank_01_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_33_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..57ccf107a22fb5f3cc50b6ffa5de2ee3f8374e20 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_33_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9bfd4e3fa68081d7e2fc4fb148341cad847a200340a8ca55a154d32921c41142 +size 199058722 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..056e5f68af06f711add752b1b7022056544de448 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1f7c40897d1724be0781e2645b9aed5004f2248fb514b1401214d6806823a2c3 +size 199058722 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_34_mp_rank_01_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_34_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e6068b6032352271c777428d8984cdfc111bcf20 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_34_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d9956218f97b6b78c20cd3ade75d8b6705b909c1640691f2ea339705778c956e +size 199058722 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7e4b064bdcf5cf3777051d1d606a4919268aaafd --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b0cfc540f2752c6479206289b5abafaf8a3cdd06d23da971d0f0fdcbdc552b10 +size 199058594 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_35_mp_rank_01_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_35_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cf9cae69a1a7c35ff8a68c058e5e76c9063a5542 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_35_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fa14c55cacc6b45441470f2a396bdc8805d57e63a9f59ca7a12d028d1dced12a +size 199058594 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..22ab31f36985e9709a9ac68616eaa7b1c3853ad3 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7bac8d0d4a650991fce47eb985d1228bab6ef0de4bf69ba84924b55653fb723b +size 199058722 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_36_mp_rank_01_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_36_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..46a1c61db44a61d3e6e1e711ad588e59258e86c2 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_36_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b2889258047e2f1a599eaf12032545444f01a5b100e91502afd98f703e629e27 +size 199058722 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5b32a8ec548aaa941d860961d353f65f30077b88 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7932b65eb38bb678275c6dd0278f753712032ea1da48c9e8055046016c9300c0 +size 199058786 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_37_mp_rank_01_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_37_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c2ca4b75bd3bfb5b717ac75df8d0e868e934a27c --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_37_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0ea3c7087aa8afc4866d5bc60f12c1233db26da2f1d0610dc9dc346bc6e1d733 +size 199058786 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c9282dbd321a86fc41c59e6abb29237154c72307 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5a6416ff94d1e809f3750470e3d817ca3ab0d02c2906a5d1be16bc72d65373af +size 199058850 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_38_mp_rank_01_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_38_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bb053dcc04262c4ff0c587e8d62584c9fde703a0 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_38_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:13b8538dc37c8c486e3dc3dc1fe2c4c0800eeacde2e8f1f126a7c54c601e396b +size 199058850 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..63403b7180c7fd3be1b44037887b24bd972eb569 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:32fcb46c9aa0bb423a6f7bd691e6c4bac620b73c3a33b40ede0c4c9f4ffe69e6 +size 199058658 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_39_mp_rank_01_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_39_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c5f0da0a2fe10cbc00fc48b207e762518b8f86dd --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_39_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5aaf116d0040ef776ff7d7bb71d13a4df124b97f9f62a68d6f68a15c72d0d798 +size 199058658 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c14ca5cae88ed8fe29fe611ed261b7a54ca7b0ef --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:91a0c483196cc8749e967d78009eb80dbb15bb6e572377ee1ec9da7f62e4c127 +size 199058647 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_3_mp_rank_01_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_3_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f35cfd9d00f492d8c0d3a9743b77385803b2eba1 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_3_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bed5d2fa179b5dd50c2a9ec9a082edc9808329a81d85afacaaccb0a4c00c5e35 +size 199058647 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d91d22a8ebb54d071238c2a083387fd03f6ab73e --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7f748982480016d83c2a38d49e6b33827fa2f8c89170cb573a75fde61ba43472 +size 199058722 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_40_mp_rank_01_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_40_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7d5df8d1674eb33142e140b6578978d67e629f7e --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_40_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad7ab8781006c3dd4d8e15ba422d902aaf6de5aa326956246ae58c4df11b5ab3 +size 199058722 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..253f0304edf15e81551436b27751e4acddd608f3 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1a6cb72e911194149e865d4e25ae969d7e5249c9c5b50bdcd606c785b080f052 +size 199058658 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_41_mp_rank_01_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_41_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..27e08b9158f46f9d1d8185f82a6e7c2379651a4c --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_41_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:caa067a3543ad980a2330afbe7b7d57b90aa45c8f002be16d79c3e16fb7e79d9 +size 199058658 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..11704544d374d7d0e340ae58234c943715dae0b4 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c374f3501a48db4e1bed39b0010f80d0d5ec74b1ffc81bcb56ab524674202a3c +size 199058658 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_42_mp_rank_01_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_42_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8eb9c74566972aea79f44cb57f1dfa67d4836c42 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_42_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:78ed48b2b291d21aebc72d81cdd0c85eeda241c8ccc43bbee6ebb4655db52d56 +size 199058658 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..544a692b7425fa8a5292a756fff76f70e7f88e5e --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f6c4541aeb6dcb3b67e20319219ebf97a22296639c1a94cf5477c8e8a528d167 +size 199058722 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_43_mp_rank_01_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_43_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..91d27bffcbd44ea8ed9a96050fbc1b0f483a79ec --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_43_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0e0e0d72b30421b644b056f39f981bd4417662aff5495791a77edbf8510e35d5 +size 199058722 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ec637199d0e2cf653b8ac9bf7fc1f8d6e2f25c51 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d25bdbbda8201cb0b443e5caa28a4490b997a516c00a2b6ddaf6ff07ccde4e47 +size 199058850 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_44_mp_rank_01_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_44_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e86be826aba049f4536581609f7ee6c405b5c7ef --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_44_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:162dc3509d0c76be7a0a5a26fb087bf69568c6be6e4eadeeb1c4b80b9b7ad855 +size 199058850 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9d3a2251f67b26490df4713091430b2cc90c8b6b --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7f970dfc5812a0c3dc47a0e4eb53e77ea5c862932a7da70c28cb5629e42dd2c1 +size 199058722 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_45_mp_rank_01_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_45_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dd909cccf387182b2afa02616c6715b1fff62a88 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_45_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c49dba585a30e201c742c0bb09fcf9244df957091c9ceba755b36b9e7a544afc +size 199058722 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3c87bb339b2a9780a521edd3002ea693ad6a1f75 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:275bb6d61a3301ac5d4bcaa5daacee51495e5c2ac6d01d794c176482ae3fac9c +size 199058658 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_46_mp_rank_01_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_46_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..15e393b201c9b378a6f0db5d3417c881255dec57 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_46_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b1a5cfedd21be2e37e00b9ff9328711989795be11a03590d67e954418dd5454b +size 199058658 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ed2658dee8b833184d690b96fafc50fb5b4da970 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ec69cdff16d078e83ba9d2586561d5e7a0a2c7c2c90e20b6a8f5fe5c00bd3e98 +size 199058722 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_47_mp_rank_01_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_47_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d66c1506ac0f21d5c6a3b7d54d7471569d846cdc --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_47_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d5c33c4205e9cb5fe7523de0c7b952ab92bd53f98620f51ef19f195068f7a086 +size 199058722 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0cdd9d8c5b549287578bef7556dcf65e60385546 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:64003b6f04793a926d81a643cc29344756a65554a6c7af598c5c18c9f547196e +size 199058658 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_48_mp_rank_01_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_48_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2e94bbe7af67b83b7215fc66a42cc25a961bfc45 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_48_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7356e1a1aa85f7123dc46e40016734f8c1c9d744f5930e1d1e685def701429b8 +size 199058658 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..eb830a491062e3784483f9c55359ecb3b2585dfe --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:be8b2f390cf13d86aedeb576c5a019e73e02b81296367cc3ebf3da240308e539 +size 199058658 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_49_mp_rank_01_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_49_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..70409c70a3ea41264f21e073d0a48011a2102043 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_49_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9d2ce368102a3271054404914e26b9122ded2bea3977712b2e1926b022b50347 +size 199058658 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6f7726d8cba65202e6cd076f56a98aa515a7cd8b --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f15ff0da97a16fbc49b107b130444049247bcf9ff773aec7aeac68e40b9e4a3b +size 199058775 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_4_mp_rank_01_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_4_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..561a501fe45cf84021b9b782360bd3b7b2f8ec5c --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_4_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f7b22d27b5f66f4ccbdb43a30f0c5bb1dce29c28fa72ada8b9d18f9bfc9defe8 +size 199058775 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8b0d3ed887a008fb30388fab0c68434a448bfa44 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fe09ffe39f75338b60b26d187b66de9f7a12eec4f988333a9f7780a8bbe856ff +size 199058722 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_50_mp_rank_01_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_50_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6d52851444150083e13220350ab152625220cd8c --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_50_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f42dec4419e4560199935df69fdc2b7c8ee9b0bc8bd0d2f834947bd53fe653d +size 199058722 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9f65641cbdf533538e9f6c7f591b401534229092 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c1eb7b9bef1265956fe6d1e8902b4f3ad5cfda312f9ee00b96d13f0773db1ac6 +size 199058850 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_51_mp_rank_01_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_51_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3c58707129bb469b67dc965f9973f747b102c106 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_51_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2a624f3f6723b3d03e22175fbaf1156c3cd913f4d4c7dc41fcfec037c4852691 +size 199058850 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6ec8b2030cf7ffdcb3bf25980c884736e7a02286 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad98550ff6533181a21f05ae367b9049fd35702ac9816a16be94745aaa055264 +size 199058722 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_52_mp_rank_01_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_52_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6930aac000a765fffc556ca266b95b19897ef2c1 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_52_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6709cd302cca50f30feaa7b2b99a91a258945c3777f88c8f7f4c0918d60cf162 +size 199058722 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ac70f8866505443a0b1a6cacc37b3037f7bc4d92 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7908ac4cb7baf9c3cff995b9d3d8e4a64b497dc54b613d39f8139bbbc8301bcd +size 199058722 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_53_mp_rank_01_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_53_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..28d93958a07085403a6c3f2f79ac8a5c8b8e7e32 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_53_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9bf25774d9d670df76bc3b4f246dcb25ef7febee43c85c3c32d91ac8140ce26c +size 199058722 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b1b648e3cce7f2644421daae610307ce5377ffdf --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:decbd9ac39c124ee9dae2cb22f15e1e5c850c0b8fa0fff6ab8ace73356bbd335 +size 199058722 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_54_mp_rank_01_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_54_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7e75db9f67fa87d56adbd035a82d2de493684bc3 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_54_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:32a12f3835c15e9970a368003068f73fc68b4154d16ad6b77555031fe636fa66 +size 199058722 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..99d3fd279cb400b1180ad3bf68dcbea86088544c --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c869b2b2d373c5657982dcbcec5aecf7ed37b98567fbd420e703660e1c750db7 +size 199058658 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_55_mp_rank_01_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_55_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1a5c32a8b1c04448daa95c0645412d0beccd178e --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_55_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0a79bbc96bdc7be3f640b6cdb827371555631cbc70d0d559e9cf2bdd29d78bb8 +size 199058658 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..49918fdc58e617a703ff59f2e6025aa38c31b636 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:341cc19ee906c1e92c2eed288350c02a0d0bea0fcfeb5bc8b8ca48668fe3a968 +size 199058722 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_56_mp_rank_01_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_56_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8a979c648ad14775c293f7ed9d83f36b130d995b --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_56_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3d5c6a241526df5f87b1d804a80fdfce9d8e8beb9cdd70f260a924d9ec164ebf +size 199058722 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b2b02cb49236c2d13aadb130a43a154a08cf50d0 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:294e44bf3d92e594a477bcfcb54f5f9a31c215ce9c5ed62d216ad7311de1ad15 +size 199058658 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_57_mp_rank_01_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_57_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..19d7cf1f3d4990bc3551b245938c06e4b03eb9cb --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_57_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9f7104166ac28982afaf938882945e62707a9cbd7751dae6dafea0e5d95a1665 +size 199058658 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a96107672308bb49dfe4245e2a7645602495a757 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:255fe90792061277fcd1646b2a70901630bd2aa817b440248b6d84a193248313 +size 199058914 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_58_mp_rank_01_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_58_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4ba6c5ddb3a5bf161084dd4fd909db1bcc6e7f14 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_58_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a29bd2f6d77bb14a3d5b22fede00f9e7b297418d1128939128566af19ed2caac +size 199058914 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1a89f904a84534f3de05dd60236670ce05f36888 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:257fc341e2b5e3821ccb056120ec23cb77ef3bd89a8e3a220c1148985d403a38 +size 199058658 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_59_mp_rank_01_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_59_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..288c7a0c0d5984fba847b23910699125978c5d6f --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_59_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1c066d2856294251f035f3af27d9a0dec2e6694e9a4b9316ca7357cf38a634a0 +size 199058658 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b1edac6dcfd4b3ad4a4253eccdc0ba56b44370df --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4e4bd87d704c2abc2bfc4a7b3e71a8968ad08e3668c6a8c9b581cf8704cb041d +size 199058711 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_5_mp_rank_01_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_5_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f27306cf4b335244fabcdf221186480d92d218a7 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_5_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0ab49ccee0c05f50db645641a2a28e998f2eafcb4c2f7d53f77f4c9f98a815ec +size 199058711 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b1393e7c28011a61a9dcfcc326fc0307c1941d95 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:770803d9760ed5abf096c83847a894af51b9cd8823d3a5a642e4077531fde92e +size 199058722 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_60_mp_rank_01_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_60_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..85d0c691f16f53946a93ec96e3318b1a8d809431 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_60_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ce5c1a32a9e05b0d809921fe50d5941a801132fe890d97b2c314ab09bdc5a2b6 +size 199058722 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7951de4b8110ae0be7fee9ec2786d101bf1b46c7 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:622006967f3694d8b43593692ae948849b16c9d884bff2bd7ddd0d5e86d9213a +size 199058722 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_61_mp_rank_01_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_61_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6ce9acd1b111557a960930c0f3dea29edfc203cb --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_61_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6830d7ab4587f537efee9cf95df3c1a1b3dcf293cf210ff6b4b3952ec3c48e61 +size 199058722 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..48b6fa9c04fb2d67421386991e0520a5bb92cb03 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fcbfe49071306bd63b5a0a3f8e8506fdfb4a381cf9e10a67fd03a48fe2f74da9 +size 199058722 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_62_mp_rank_01_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_62_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..011701a261e3f6dfab2c852ff5d4d56c3d444cf3 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_62_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6dc88df0f752e4803c9d21e19f4f28a7ab5c050e873783b21ae7018700588bc9 +size 199058722 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fce700f12cd4057e023109ae83219f0394b9dcdf --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5a421c73662672f8eae8478cdfd98fa440204aedcfdb9af5dcaab9cfa39c55b6 +size 199058658 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_63_mp_rank_01_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_63_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..685f09090737fe10634b4c3db53c53b57f239f10 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_63_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6de781c889575158061f9cfc516416996425d72e7b0a5f31919683dcfc2193c9 +size 199058658 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ed75f9d2f96cdac98b71f39eff9dc67dee71b8f1 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ffb9216c9175fb44f2ce8ed7e8d8d8d0f7e9db31e51aa96088bb7dc00d2fd443 +size 199058658 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_64_mp_rank_01_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_64_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b983206a91dea2db9d3358ea68f34ce67bc83f1f --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_64_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:79ac62efaa446d599e3fcf02c0960db12d4804f476ec75e5495fdf68a71cdc75 +size 199058658 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..beb911cff73dd80e1f97092e04be5fef308dcb5e --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c289860900508dc7a78ca3fcac105bb4e0dc947ada393ee72b2dd52de58de418 +size 199058850 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_65_mp_rank_01_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_65_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..79e90ce8b042f15ca593fdc727c38bc99caa6853 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_65_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a931827791aadbb859b3b6fc5f10727480ae43c1c11a66d5386c6f4ddb8f657 +size 199058850 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b33777510246c23b70993aeae76805db5f3d3094 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9dc0831bfea75dddeb4c88643eb0ec984120c0d883b205111f5c153e148dab52 +size 199058722 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_66_mp_rank_01_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_66_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f784d88732ede1e1789df7f6ade235e599e2a09f --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_66_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2989cd75e2df0ed5f2632105d924a4bec34ecd4f18471d07598149a329919236 +size 199058722 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e3d2d6b29ba863b1881ff80c6d126a93278f52ac --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ac957eef951caca14032cf082be5541a5e8c9d2378d03aa1a9a9694ff2fd43c6 +size 199058786 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_67_mp_rank_01_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_67_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0f8cfcb8a622ab81a0c942eca425e2df820df06a --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_67_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dac0c45d1f76cf2d716374672b69d3004d7aac131faec021fed93eaab9b246a7 +size 199058786 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7421565e9bbd99af5e5899d55533ac2d4af5741f --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:204313109f76c9cf7ecd73b1d316ef1dfc4662cefdceec22be16ee78dd93889c +size 199058658 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_68_mp_rank_01_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_68_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1430e24a58e029e9f618e767cb67791fc28987c6 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_68_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:872b756432553df48bc0e01531f613d2a3a5dc815462685230ca84b692471f49 +size 199058658 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..21f9bfc0c5912f56230ad7828443183db745027a --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dbde537e716019dc7695606a5b17605ae627a11ae007737639210e6d46248792 +size 199058722 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_69_mp_rank_01_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_69_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ef794fcf430659538ed3dcb4e172d5f285048a0b --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_69_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4ef220464ea5cda8e22f2da1a0bdcef46c477ee93a7b75b79279e3a467be9654 +size 199058722 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5987b95b0694ee833016203d8eb442b7febc400f --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:26c6536b4958f19757eb6a918adaf4e0e1190285278f15b39f765a8f81c5aa38 +size 199058647 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_6_mp_rank_01_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_6_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2b022cd24a0189f336511dc04a256320960b6ccb --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_6_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a08b99ca858dd6ed74ee6b1d066f6e1dd003988c53f500583cc222d06c3fd99e +size 199058647 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..db4f6ec6d6f2ea4a496b0e170b9d021b99274121 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d00cecfcd64c1aa61d33886fd7a0b2effcabc378d7e8e0f9bcebbd0a513b2c0a +size 199058658 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_70_mp_rank_01_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_70_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a28d297e3661a1e840337db4f24a01310a8e58f1 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_70_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:720cd6632971b3461e56b04f3aecf669f787555975dfe933b718d67bb8d87446 +size 199058658 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d5535677f5619970247e94650ebc3fdae6880726 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e695bde83ae8202cd2ca9a56baf244c3ecccb6a05d80c417efcda4bff09911e6 +size 199058722 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_71_mp_rank_01_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_71_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8d2c4035b69a577bf009659f0352a40cdeaa810b --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_71_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7ff1f02e7320d4091ad56ed015f0d52248086f9d71a6dfea22a5010fedce6ae9 +size 199058722 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ab2a0a720d445e45066509e687b9d341e12a1668 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:42bade9224196be4c2bf4d6e0e774098747b59a5910956d24efdeb1978fb4c96 +size 199058786 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_72_mp_rank_01_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_72_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bc7244c5ec14ac69a83b5f085b6b63b1ef60a935 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_72_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c0b7b88828bd62da8a1d8fcee4f58e3bc80b64fd139057c06f3b72ceb4bb28a +size 199058786 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..99971f92a4f3853ae5efa89d185905a2019583b7 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:142c7e0c64a5ad7d7ef192c01320e082fdb5a3581555d182f3e33718b9004be8 +size 199058722 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_73_mp_rank_01_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_73_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0bf8e5df9c17e8299c3e89829fd56e8ab94271e8 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_73_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:60d704998766ef5a3d018f9181fda71128389b616326e498d107b187f63c06eb +size 199058722 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f81ddbd111dbc266b98216a49c2d298fbc85e875 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7b8f846ce5096e8604eb787ef62c9cd71d36a35036f93203b0415a3d50ff76a4 +size 199058786 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_74_mp_rank_01_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_74_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a3f092e593259a48ab9c8b904064815f0fa72013 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_74_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:834327b6c10ac2178fea4c2d3a8d5340756960cb5a1173434680c7467bcb1f26 +size 199058786 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2ea0806da3a8d0d8049e8f52edf52491469771e2 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2ead29c5ca9594707218e53800ebc5b4a3673c229a07ce69092a19926a5172e6 +size 199058658 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_75_mp_rank_01_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_75_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..97e66ac2673b393f8f001733f6afbef05df7d052 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_75_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7aa90c30602cce759d95625977530befc96dca7e49390fd7ab31e6f9cf8f50fe +size 199058658 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..69cd38bd929aa382e2b177a370f2f48b007d866d --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fba29f604bbeda71c40b53e3248656d33f76a6042333c963dfa6f26712296c9b +size 199058786 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_76_mp_rank_01_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_76_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..604ab1eec6d17eb1056255f6b1d788a13a31e5b8 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_76_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8cf89e1e637d5bdbd7b63471ac9f0bab23cb36a11581c70fc1297eb8aa49b528 +size 199058786 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c981f764a7344fc091ffa2f5d65231e8e6b44223 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1990921fb1609e0e788e6a321c9873ea15f4afe5a33b6fff8de9bb70dbf1361e +size 199058658 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_77_mp_rank_01_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_77_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d4ead0d0876d34504e4e19bf70ee6156ba6a6dc7 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_77_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:34ecd499df2a4b762eeb4d310b8ed0a4c588883723009ed677474d2a5f77f217 +size 199058658 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..743ec23b379c5697fe5c8164b29b245eb8944ab3 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5120e1d31c49e4bc3202cce764d6861ef26de68b2a4a813357812d55345da0a9 +size 199058786 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_78_mp_rank_01_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_78_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dbb2e688bae1e15e87a690cfb8f40a74df29950c --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_78_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2dd636a0377237a68e1c11c64c311e88f6170304780f3d0282161aa55e1040b9 +size 199058786 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c7706f2741a16e3ff6f9ecbbd6d17478f842f820 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:afd99d2244c300fe8cbe43dcfa70c38717a8cca7052bb96753b9ead34d652846 +size 199058786 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_79_mp_rank_01_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_79_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e70bf3fc2c43f32e0530aded29774cb0a6b9e98f --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_79_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:738a430b824da702cbf05e8b52f9b83cacaf3d33feaed06714a35bf42d4b1c7b +size 199058786 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2f7c673c512bc447b64978eda5252fad9f7f094b --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a88bb1f1ff90f69e62792622f5d9e3833035c47ff64e7ac1486493cd3fa21e7a +size 199058647 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_7_mp_rank_01_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_7_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..beb46b418707055e31452d7402b2e6576a1d0b90 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_7_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6c16c0cabaf389efa026a3aa48a43f2f5360338ae9280fe70fec5e6b722edb05 +size 199058647 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a4eb8199e7af7674d8c679ad8849353b2da7bb2a --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eb3a0339b4a2053fc24af3aa12b4e586d44a806fe212119177b4a1452665dbec +size 199058722 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_80_mp_rank_01_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_80_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..eccb02cc0de70784bcbedb935373b8c241d60041 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_80_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:448378aef64977c912353543bac6ce0abe7c6a31d0986423a721f15031819c66 +size 199058722 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..871b59e7f8fc6431057d20c07d10d3a47ad5b3aa --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:be99eebdccf9c4cefdde168f70a6b51b57fb9adcf3dc71dd4888572645238faa +size 199058722 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_81_mp_rank_01_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_81_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a42daf68e635ebfc97080a0ce4b8cca6f112d0f7 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_81_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e842072ece5e3d4d651b172f4a65835d7f3187f6dd6d90e21f1267600d39747b +size 199058722 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c0c760efdd665a08902bca397e4d965e25b7b0cf --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:678b21ea8e6f794c2a35383404cd9665a09546b31b6d6eaa1ab6f1c5b5663438 +size 199058658 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_82_mp_rank_01_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_82_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e12832fc58b848285d080fbd81b506ad7ff5485a --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_82_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c8678763af7f124103d83d42427e25125d19f7ac8d7521005d03b78e17f80509 +size 199058658 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0cf44ca4753799393fbb9f8bdc1b58871c3bc16e --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c1bb443f9b51d6cff698de26d3c3c1c3765494590dd2ae31137ffba8a726fe96 +size 199058786 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_83_mp_rank_01_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_83_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bd44c46ae227fbceb18fae4028b97e09cb859dba --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_83_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8fc90f6ff470158055baed598c7bdac2e6eb09c1355f61f235e628ee85ef8536 +size 199058786 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0b8d4820aec69bc419e16196f054569ed82748a3 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5b07f764c1f05f2144e8341af76f5b8309f4f3645bbe2710ddacfba828c4b188 +size 199058658 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_84_mp_rank_01_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_84_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d57205ff8e4b1c0c3173baa271e60eb1f8996426 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_84_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c874df0bd67d6100a351801bb3f0598ba83a33e674f742a59ead5e1127c649cd +size 199058658 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4bdc550ff5fad4366623e5b5d83b97f0c8d6d101 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3d79eeaa7482470f822ce6bb3a7568b17a8e11db8355bf273c26472af9d9248c +size 199058786 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_85_mp_rank_01_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_85_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6e12d537510331239605066dead7b56984649783 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_85_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f8f2b335a8e14564e75511c0bd90a897d8481c2d8a733196a5324556c3442a3d +size 199058786 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4e763d0a35195d7157d2e4a5f6ede89b68cd784e --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8301d81c8fd7e820c044e3505ecdd1c293540092c2498a8590a931a71212b1e2 +size 199058786 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_86_mp_rank_01_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_86_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d3ce8311607d67253eefb38bcf99a2eec17e9897 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_86_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:35da3af216ebf2969cec737e9c8e0c91c6f06e24cdeb9142f3abc00f78bfcd27 +size 199058786 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..391699eda93aa2c1663bd9a80a618e65dc751244 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:acf4c90c035b60a180a8335cc0e9242276ac378729815579c39209f425f587db +size 199058722 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_87_mp_rank_01_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_87_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..38d0d05bf79bef93d62a5ad7eade7494b16fbea8 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_87_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4dbef16c0f72049234b8b0b705bcdbca4ae0bb4e4572a8fe9980f72d8787610a +size 199058722 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8092874ec49ab04f5f4582c7fbdba1ec29b27811 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:baf9dbe463abfe54ab73052fc4baaadd73b582626f34b08e9cec0d49e97d37af +size 199058658 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_88_mp_rank_01_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_88_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7876ff54b7096c599e7092500c799721a5ebe45c --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_88_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:07cee03a007f79fe9017fc6ae59c92bb725bc5d296074240947e1276fcc98fde +size 199058658 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c9a080edfaeaed5f65a46868a60d70baf7bd0f13 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad7e6a7abde228042a2bea0e708e8484b3e4add52b53a7ec7b1e9eb55d5c0988 +size 199058658 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_89_mp_rank_01_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_89_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..83312542160abe3df225fd4b7a992e822dcc3c7a --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_89_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2c20966fb8507d07f1c1313876855f57cfc2678cefc6d1fc5468b17b521846e5 +size 199058658 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2aa07df139d1e3df7764b05ff95da4dd45812748 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c1d2ded2fa55af744dd5bb5cdcd81fde454b35f6f0c898394e54aa76828d4e46 +size 199058647 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_8_mp_rank_01_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_8_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2ee3b0291fac088e9854ed5754e0943de342e59a --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_8_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fa7c82e29c868ed64a6781f20d60c55bc3dd47b13d9424d5e541743645a8b3b3 +size 199058647 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..92be303a3ae91c3831af3676f021622dae84b499 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:91a2a39f919907bb4d7bbc992e9b294b26ca16bc7c3a11865ecbb6629bcec1f3 +size 199058850 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_90_mp_rank_01_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_90_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b3df82689dc8e014908a0b28ed050960781baf7f --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_90_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9613bce86c4e63ed391e84082ae7fe86a70ad783b131a34ab65813c9a24300e8 +size 199058850 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6d7ccc6e9aa77a661e61206d5a3c080bb40eedba --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:040def6f4fbe1997b689699c2469422f2d82b8855ff544d8ab834146da97f649 +size 199058722 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_91_mp_rank_01_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_91_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..748cd61613cc8e99c15c42226546cffb73bc3993 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_91_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1741e25fab13ebd55c359b9841628d9b2855705156f2f03f95fe11f989ef29b1 +size 199058722 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..75250ae87c36ffbbffee6df799e08d4970a55752 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:47bbce1a018e8349a9f04e8ada8dba4cd3abe43666508a9447fd65001dc0193b +size 199058658 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_92_mp_rank_01_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_92_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1de87a78fb78a06bec79748ec1c469215b1430c7 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_92_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0caee412347791053b9b373393007178dc4201b23a4d877442c7b04f43a2e676 +size 199058658 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fe5787ea7c90ec2d970d2b209e49ed1a58606804 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4152cb839eb4fe307c9b61861310e6a2dcee7d4c6cd15a4c323938031f2703e2 +size 199058786 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_93_mp_rank_01_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_93_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3e61f2be19ec4145fbb85504af0425ee205df86e --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_93_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:070cac0e758beca58004fdf41941114cbafd38acb878bbda9a15505034d2e416 +size 199058786 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..999c4534f3d081fcf9d6c4c9724411c203d50f17 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:74b22297e4045af46a723dacbcdef9676305353653887fe190da1b79e78e1218 +size 199058722 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_94_mp_rank_01_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_94_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4a20b2fb624de26acc6d92927a18a62500250b36 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_94_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:621d4e310cf2c6af31f4ac380b2851afba421ba4b1d75de11c2cfa5ba3262d3d +size 199058722 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..eca26f64379435a999eac1281625bf4b4aae31d4 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dfbb2ac9f7e8ddced1f149e5c1572ed098dec7a76b925f5dc6aa9720f9ed4d1d +size 199058722 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_95_mp_rank_01_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_95_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..904723f04cd2fcfbff768e553447f38dc1b2976f --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_95_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5ba1774d70fe0724b3c3d0b9feb741ee7bff30b6c6cd5bc7c79a40ffde3795c9 +size 199058722 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0909b0b25e383d4323a40ebea4fd67e4e6118b3b --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f1a04b7195ff9c2abe01cec65d62a4d2fe494cdddc99e26bdfdfd1ceec2fc9c6 +size 199058722 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_96_mp_rank_01_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_96_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..511f414e7dc90ec7d67d9ae72ae4f6e850ee405f --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_96_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:26a90509f243810a956f77d6680ca9b547ea8533c6181e27ee02a352ae06aaa4 +size 199058722 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e9756b8b9543521318b5c37d0a9700819937cf1b --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cdee319d02db24b4ee5057f1e0d6724bd4d33a0863925c2f55e8c3a3db8c109c +size 199058786 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_97_mp_rank_01_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_97_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..21a53f47773a6281c427c91d9f83c1d0e3813335 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_97_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:12df1a460ca1c36b1c757ea87a81b6860033b7e5ac697aa2ad7a0d601a459056 +size 199058786 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1199e29a860a13e39845ee2430f45f359628d5ed --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c44f70e0ceeb6372a938d015d392186e20d15abd313b040a4ddbda858b76984c +size 199058658 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_98_mp_rank_01_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_98_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7883895b9f2b1fe357ae8d6029b2e92e502c77d8 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_98_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:66f33c4c0c64028befbf61f0bee11bc36b4676770ea5861a81b844793f4aaaf7 +size 199058658 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ded3693ace8ccb0f7351265951e41e8dba88aa50 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d9175b375aa7499218a9e04e47e6f58b37714adc60d008e6cbc98073f0070106 +size 199058658 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_99_mp_rank_01_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_99_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..60dbf3ee93687bade9790ffb61f304aa99e809b8 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_99_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:01c5520589d192788e4d263eae8ab6d43496d2db9206a25185a2896faa2fb6dc +size 199058658 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2d53ce545b5ae47b8756c524fdf9633e08edeb7c --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e9f788ea28999c3d33538e7167c57cb653c3361b8ee0f21bd0a6628f56b178ca +size 199058839 diff --git a/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_9_mp_rank_01_optim_states.pt b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_9_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2b14c6716ebe9a9468c935938892cadce4abd74c --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/bf16_zero_pp_rank_9_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:41f2099ecca85dc549eced59279d23f141962daf5a6668033cc48b26b0a2dc42 +size 199058839 diff --git a/4b284b6bc4seed3/global_step80108/layer_01-model_00-model_states.pt b/4b284b6bc4seed3/global_step80108/layer_01-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..50caba143fba7b5f774b087bd9a5b74261bbe715 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/layer_01-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:56087aba70c808ba807cb225a7b170992b1006d4ecf7ef0d9cb9e3df2df91af3 +size 167511299 diff --git a/4b284b6bc4seed3/global_step80108/layer_01-model_01-model_states.pt b/4b284b6bc4seed3/global_step80108/layer_01-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cbd2e342684e8ba6e95d138580bf2308523dde32 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/layer_01-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ccca5ef31b66ced91b5d8f981947a3db50875d8e37d75b273eb71629cab11f90 +size 167511299 diff --git a/4b284b6bc4seed3/global_step80108/layer_03-model_00-model_states.pt b/4b284b6bc4seed3/global_step80108/layer_03-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dc4a31505d998f643a10bb6da52fb3baaaf0bd9a --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/layer_03-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9b62e904208c776ec13b91780c796ea5be87f0773b6d7e83190170e32fc3dd57 +size 113308931 diff --git a/4b284b6bc4seed3/global_step80108/layer_03-model_01-model_states.pt b/4b284b6bc4seed3/global_step80108/layer_03-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..52f82c7c72ed00943661ea6c2a48925c64d2289e --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/layer_03-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7939771c187ffd57465bff586bcdf18a727d84ecaddcb5797e9db06fe1ad17c1 +size 113308931 diff --git a/4b284b6bc4seed3/global_step80108/layer_04-model_00-model_states.pt b/4b284b6bc4seed3/global_step80108/layer_04-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f2fa50ce61b7934680a4dbb243a5cf08a3f6b209 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/layer_04-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c321b0cf6a270898e43fd3ed8397eef0d58e8610ed0ddf2d0b3cc804991dd44f +size 113308931 diff --git a/4b284b6bc4seed3/global_step80108/layer_04-model_01-model_states.pt b/4b284b6bc4seed3/global_step80108/layer_04-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c6749bed24cd242f70d85bf9acfc34e693746586 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/layer_04-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0a3628b7e2629dd5b67ffc3c6113f028a7d2f65f91c654fb52fc25da7901f68d +size 113308931 diff --git a/4b284b6bc4seed3/global_step80108/layer_05-model_00-model_states.pt b/4b284b6bc4seed3/global_step80108/layer_05-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f98d25cbdf7b332ab1763f7a5ef4bd92089ddeab --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/layer_05-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6cc8f8eb97a594a0cf66b22630f2d921719e104a6b22e8962e286fee7f598ce0 +size 113308931 diff --git a/4b284b6bc4seed3/global_step80108/layer_05-model_01-model_states.pt b/4b284b6bc4seed3/global_step80108/layer_05-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ac4e025d4de574f2403bdeed4857b53a55018c39 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/layer_05-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6c6e3363a8481b54132fe698e42161119924b29e6f70c64c51ff8bedcc0b0945 +size 113308931 diff --git a/4b284b6bc4seed3/global_step80108/layer_06-model_00-model_states.pt b/4b284b6bc4seed3/global_step80108/layer_06-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a9d4391403d8b17d363fbab34d8034e5dc8c804c --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/layer_06-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d612da01523af0b8608f811189a7e5ad530ebee2ff0cda068c94c27d709be35a +size 113308931 diff --git a/4b284b6bc4seed3/global_step80108/layer_06-model_01-model_states.pt b/4b284b6bc4seed3/global_step80108/layer_06-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..29f480dae3a39a08d43b35fbf5fa00dd09bbc9b6 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/layer_06-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:778d45e1ba7e60e1052bc5be611f62b6048f3a5d30d6fd5396ab63d18b916dcb +size 113308931 diff --git a/4b284b6bc4seed3/global_step80108/layer_07-model_00-model_states.pt b/4b284b6bc4seed3/global_step80108/layer_07-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cd0c2fcc2171ea457a2cdc8a78d3999af38ae6af --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/layer_07-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7093c636a7107174b86d8f3eb877c830eab123271004b509b7fa8fe5bb400282 +size 113308931 diff --git a/4b284b6bc4seed3/global_step80108/layer_07-model_01-model_states.pt b/4b284b6bc4seed3/global_step80108/layer_07-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..add359cbeb86cb984b0d27158e3ec6092a769a80 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/layer_07-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c4dd0a94db4693b224c92cf4db0833b0e657609080627375acf568efe9f9d88e +size 113308931 diff --git a/4b284b6bc4seed3/global_step80108/layer_08-model_00-model_states.pt b/4b284b6bc4seed3/global_step80108/layer_08-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..436fcf1871e080ae8daf82b392c0e6e346bd6870 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/layer_08-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4d455489dc4c81390864bb5eb9bec67dfeee6eb4811f1f5f9f73cef0a8013641 +size 113308931 diff --git a/4b284b6bc4seed3/global_step80108/layer_08-model_01-model_states.pt b/4b284b6bc4seed3/global_step80108/layer_08-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..74d0d833fc93a3656c7d789b70b01e4ca0681e44 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/layer_08-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0089be5ffb0d24423a9d3bbb53aac25e597e41d77b5b42ae1ab889f1a7609798 +size 113308931 diff --git a/4b284b6bc4seed3/global_step80108/layer_09-model_00-model_states.pt b/4b284b6bc4seed3/global_step80108/layer_09-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9dcd40d3acc9fa5f709e1a4083e04b9a4e32fc5c --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/layer_09-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ac288e98fadc15a622d56bbb9946f34fed6fe929e29f1f0a7ba5b61890aa1ec4 +size 113308931 diff --git a/4b284b6bc4seed3/global_step80108/layer_09-model_01-model_states.pt b/4b284b6bc4seed3/global_step80108/layer_09-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a97ef6e8e7d7c6830107c9ce01f55836dd160a9e --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/layer_09-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:56bb38c7f4696416b910b5c92cd03589220dffa3afc6ff78c94ce68fc233d5ee +size 113308931 diff --git a/4b284b6bc4seed3/global_step80108/layer_10-model_00-model_states.pt b/4b284b6bc4seed3/global_step80108/layer_10-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a6dec4eecdf1c6b6f3c7cc979f36d1a36aec2e00 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/layer_10-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d7d3a28d8dea0f6de7a4c55752faf4e0a56be987eea0045cc1052296291b0892 +size 113308931 diff --git a/4b284b6bc4seed3/global_step80108/layer_10-model_01-model_states.pt b/4b284b6bc4seed3/global_step80108/layer_10-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..79bbbaea7843a55ab184e9e674ab872a486bcc09 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/layer_10-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b3a3d44a0ff475744c505006647dd6705d4b57ed618edc699a92f633b49b0d62 +size 113308931 diff --git a/4b284b6bc4seed3/global_step80108/layer_11-model_00-model_states.pt b/4b284b6bc4seed3/global_step80108/layer_11-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1a078c5d212f562f8780c6b1ff9c7007913012b1 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/layer_11-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f065df156baec9ec30e0fa6337509cc285eae82120362b186445771fbdc54c6f +size 113308931 diff --git a/4b284b6bc4seed3/global_step80108/layer_11-model_01-model_states.pt b/4b284b6bc4seed3/global_step80108/layer_11-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1ba6b21a4d2d1a930e602677b707224157716f76 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/layer_11-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e1df2997f97265c1bce4937fa2472812c8bc9d1a7d883f817b0f347292f74082 +size 113308931 diff --git a/4b284b6bc4seed3/global_step80108/layer_12-model_00-model_states.pt b/4b284b6bc4seed3/global_step80108/layer_12-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a3f8e72a1919c96f9ebe5b0076312a8da8b5bee3 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/layer_12-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fad7bcbbe185ffe570a1dae4c706d5adb3b5897e53696a4ef68f772e6ff2c304 +size 113308931 diff --git a/4b284b6bc4seed3/global_step80108/layer_12-model_01-model_states.pt b/4b284b6bc4seed3/global_step80108/layer_12-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1cf0ca2180fab526e2fe1d78b27908202cbeb02b --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/layer_12-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f8865ea41e4f9ad61573d1b3e8a65efe194f6ce1ab655ffc0778716ed45b0fd3 +size 113308931 diff --git a/4b284b6bc4seed3/global_step80108/layer_13-model_00-model_states.pt b/4b284b6bc4seed3/global_step80108/layer_13-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..51e358609461e4f246f3c2a1d98547dbddac474f --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/layer_13-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:679d83c8ded279f058629aa266deb7d148f831301fab6a16914702fb432348d4 +size 113308931 diff --git a/4b284b6bc4seed3/global_step80108/layer_13-model_01-model_states.pt b/4b284b6bc4seed3/global_step80108/layer_13-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..859844b11f4e17dba28fed802747792be308035d --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/layer_13-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:738f6d8b404bded3c862cd65de81ecb6e69249ca7bcc4b5d10cddae3fca0119e +size 113308931 diff --git a/4b284b6bc4seed3/global_step80108/layer_14-model_00-model_states.pt b/4b284b6bc4seed3/global_step80108/layer_14-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8d67ba6c939dc64bb139313b9bfa7ab465fba02c --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/layer_14-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a53674005fdc45f57acd12b6665675e2d236e8ec01c2e5f441bf79fcda7df1ea +size 113308931 diff --git a/4b284b6bc4seed3/global_step80108/layer_14-model_01-model_states.pt b/4b284b6bc4seed3/global_step80108/layer_14-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..214bdbee003defbf072775005f88e0818c154007 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/layer_14-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8196c250ce825b181b7fd04ff8408a8b4328a3f8e7c176ff7be87752ec4406e9 +size 113308931 diff --git a/4b284b6bc4seed3/global_step80108/layer_15-model_00-model_states.pt b/4b284b6bc4seed3/global_step80108/layer_15-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..428c47b53cd4dcb42f78fdcf5ed4f0075ef25411 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/layer_15-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5c1fb86f18656eb5774922cca712eab8f9c161fe702bbd4b856b88c1875cf218 +size 113308931 diff --git a/4b284b6bc4seed3/global_step80108/layer_15-model_01-model_states.pt b/4b284b6bc4seed3/global_step80108/layer_15-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4becd573f5f63161cdd3bf316d88681cfe2b2a2f --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/layer_15-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3977f132e88bd5ab87a1596aa7e3d6556f4587789d42918c66a89e4a0e8a5302 +size 113308931 diff --git a/4b284b6bc4seed3/global_step80108/layer_16-model_00-model_states.pt b/4b284b6bc4seed3/global_step80108/layer_16-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ac3174e787ad036ae8ee3668c2ac3ab83eac9a15 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/layer_16-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3641759aa840aebfe6231d3e1785739b049be958815a63d053e5b64ba0e15b16 +size 113308931 diff --git a/4b284b6bc4seed3/global_step80108/layer_16-model_01-model_states.pt b/4b284b6bc4seed3/global_step80108/layer_16-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d8bb8c13d651b1800ce2b5a9ab587bc9ef149721 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/layer_16-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df402d8d3fec7cea2cdfd4a11702362d5406a734719c7fccf6dacb7e418a738b +size 113308931 diff --git a/4b284b6bc4seed3/global_step80108/layer_17-model_00-model_states.pt b/4b284b6bc4seed3/global_step80108/layer_17-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..983d24e9f53994c065b6084a397d6f6254518257 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/layer_17-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d0aa7307b489a59748cda1bd15a914ea218bc81a7221a19ecf83e6ead7c0d40b +size 113308931 diff --git a/4b284b6bc4seed3/global_step80108/layer_17-model_01-model_states.pt b/4b284b6bc4seed3/global_step80108/layer_17-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..de5ffddb1189475983f0fe96426b1cffc2b0e028 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/layer_17-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d23fe38154d74abb07aecd233534836b2b01c0dd1eb5474d7232e2156d9021bc +size 113308931 diff --git a/4b284b6bc4seed3/global_step80108/layer_18-model_00-model_states.pt b/4b284b6bc4seed3/global_step80108/layer_18-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f61c9f2b0a5d885df39783f60962d280175697c8 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/layer_18-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:44d8006b68d29d7867280f08155ad5427b09f28c60332a8a90aa5e0ae8eeb809 +size 113308931 diff --git a/4b284b6bc4seed3/global_step80108/layer_18-model_01-model_states.pt b/4b284b6bc4seed3/global_step80108/layer_18-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..430c665f67974e44acab58cbb00b4936a3aca128 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/layer_18-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3025888e913886723c792d68e5302b3ac38de5b5d85289a5afab0f874eb549fc +size 113308931 diff --git a/4b284b6bc4seed3/global_step80108/layer_19-model_00-model_states.pt b/4b284b6bc4seed3/global_step80108/layer_19-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..85865e71402abbf505b77dda19e6316cb6fb92fd --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/layer_19-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:48464a71d1d81ce62bab20e3d786a8993e4bd23916bcc4555f5ce3b8c8214c6a +size 113308931 diff --git a/4b284b6bc4seed3/global_step80108/layer_19-model_01-model_states.pt b/4b284b6bc4seed3/global_step80108/layer_19-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..77f567e90f294a16121cc38608c66a19e6a978aa --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/layer_19-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0284df88089d7e5f57032cd7736b6317ead08e757334682a2563f6a065470523 +size 113308931 diff --git a/4b284b6bc4seed3/global_step80108/layer_20-model_00-model_states.pt b/4b284b6bc4seed3/global_step80108/layer_20-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..41e42970a73df642f40f2e7b56a66ddd1efb1082 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/layer_20-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0c8b928d79257b3a0f01a970996566907b50dcb4f530b004fc00547bbdbce792 +size 113308931 diff --git a/4b284b6bc4seed3/global_step80108/layer_20-model_01-model_states.pt b/4b284b6bc4seed3/global_step80108/layer_20-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fe2601e0aeed092466b3ac77f56c36b5c4e61c50 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/layer_20-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b245d49faceb154716378e8499fce7e1efcd2002ac79d9ea067430d243d7382d +size 113308931 diff --git a/4b284b6bc4seed3/global_step80108/layer_21-model_00-model_states.pt b/4b284b6bc4seed3/global_step80108/layer_21-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..24f96fdb9e08b37351ed8a6542ffc18732d93d1b --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/layer_21-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:56d765ab5273ad967af7c741671320e8d01c0de8f419558394382588ecb37eb2 +size 113308931 diff --git a/4b284b6bc4seed3/global_step80108/layer_21-model_01-model_states.pt b/4b284b6bc4seed3/global_step80108/layer_21-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b79b5a5ff8566034ddbbcc0905386540479a2526 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/layer_21-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cc22763dd331fa8898190ec99fca12a6cd951d963246dba4ebd921d0dca5b9d7 +size 113308931 diff --git a/4b284b6bc4seed3/global_step80108/layer_22-model_00-model_states.pt b/4b284b6bc4seed3/global_step80108/layer_22-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..94bbdd62b62b3b45290395f8d781e7265980924f --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/layer_22-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:77331d052aee0b12972179fe838bc99c3b6ef6628df62b9820ff754645c15e32 +size 113308931 diff --git a/4b284b6bc4seed3/global_step80108/layer_22-model_01-model_states.pt b/4b284b6bc4seed3/global_step80108/layer_22-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9015b8aec6d2f6cc22a71534dc16532a3451dfa5 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/layer_22-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c31abfe1efccfb6f80f8c1a04f536c940db584b753e22eff617a5302f59d23e +size 113308931 diff --git a/4b284b6bc4seed3/global_step80108/layer_23-model_00-model_states.pt b/4b284b6bc4seed3/global_step80108/layer_23-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..921eabf214de97907c56fe09c847db624ee6fa9f --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/layer_23-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b1a7fafd0ea241d48c1ae3cfd38191b61114f78d31c6d54579efc59ffc74b6e1 +size 113308931 diff --git a/4b284b6bc4seed3/global_step80108/layer_23-model_01-model_states.pt b/4b284b6bc4seed3/global_step80108/layer_23-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..975d986d020632a1adb5f9eb984d897d1781be35 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/layer_23-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:744202fd1ebbde3909b0258ebd4ea9ed9292e1c88e548d3e8494179d280d1ae0 +size 113308931 diff --git a/4b284b6bc4seed3/global_step80108/layer_24-model_00-model_states.pt b/4b284b6bc4seed3/global_step80108/layer_24-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0e0856903eeb36ee6daf6d512d99c67e2fa3862e --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/layer_24-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4ece233b49ee9d4ccdf48c60ca25ae513194606119ad2c813d4c345576ae0e25 +size 113308931 diff --git a/4b284b6bc4seed3/global_step80108/layer_24-model_01-model_states.pt b/4b284b6bc4seed3/global_step80108/layer_24-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d0c7ae8f2c540622984b434d4f3e4fab6a87249c --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/layer_24-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fe1432ababeb50bc87b6b4592822db0cac65a2a5a82dd8bee14045a1ec1ac3cb +size 113308931 diff --git a/4b284b6bc4seed3/global_step80108/layer_25-model_00-model_states.pt b/4b284b6bc4seed3/global_step80108/layer_25-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1b4877f03df08e23b129b46d37c0d78d524b95ee --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/layer_25-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a7d45da212204e60ec12c106269290e8242e83cd593c329f3fe8664d4e87c8e +size 113308931 diff --git a/4b284b6bc4seed3/global_step80108/layer_25-model_01-model_states.pt b/4b284b6bc4seed3/global_step80108/layer_25-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fbaf266d1fa0af17bf68b726c48b834af77c69a4 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/layer_25-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9efd53ba5c2a4048000db5028a6ee089a710eb91bd46b503a0a26c4ad16bc0bb +size 113308931 diff --git a/4b284b6bc4seed3/global_step80108/layer_26-model_00-model_states.pt b/4b284b6bc4seed3/global_step80108/layer_26-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4b5b5a575a9a181eeb5462da2409be6ee077b484 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/layer_26-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:15960401c5c03c2837b6192d358e21f5a72a00eb7c7fbc0a9d27535513192548 +size 113308931 diff --git a/4b284b6bc4seed3/global_step80108/layer_26-model_01-model_states.pt b/4b284b6bc4seed3/global_step80108/layer_26-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7d544bedd8e77834d7c34556665c66c7ee209f2d --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/layer_26-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:29227bb2d61e5afaf0deb12ac8c32ea5e64a17cb3ab7d3f23c0ce5befabddf34 +size 113308931 diff --git a/4b284b6bc4seed3/global_step80108/layer_27-model_00-model_states.pt b/4b284b6bc4seed3/global_step80108/layer_27-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1d9ffb00b428fee3c5a13b8ef66d775fd95c0cc2 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/layer_27-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f3d54a487a3143443616e5c21b3b2b626b283fdea02232d1d57b543e7307499a +size 113308931 diff --git a/4b284b6bc4seed3/global_step80108/layer_27-model_01-model_states.pt b/4b284b6bc4seed3/global_step80108/layer_27-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dc4ea0696776e2079f30a9ae02afcffec8b50154 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/layer_27-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:55bd19d44ea9cb25e1c1fdcfeb34381d66ecb8d3152d4e732454a179af3a4d7b +size 113308931 diff --git a/4b284b6bc4seed3/global_step80108/layer_28-model_00-model_states.pt b/4b284b6bc4seed3/global_step80108/layer_28-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..249ecb2c00be280c2a9ebf874aa239537d31267c --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/layer_28-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a00431a202e7f6bd51dcfd8ba4867ad41c95369a80558563288c5fa2239f2576 +size 113308931 diff --git a/4b284b6bc4seed3/global_step80108/layer_28-model_01-model_states.pt b/4b284b6bc4seed3/global_step80108/layer_28-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4f4ae7e137671e9000421b102acbe5e92be40566 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/layer_28-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0b43316919cb5dc9ba864578fe78b4ad596e87953ec651d777f5f20238a6d615 +size 113308931 diff --git a/4b284b6bc4seed3/global_step80108/layer_29-model_00-model_states.pt b/4b284b6bc4seed3/global_step80108/layer_29-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4f55fae83c566ba45f5c0c61ee85de963640137b --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/layer_29-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:04db35a14c1862c161efd327abbcea7f557b6ec6362fbfdf9f77ab7f239c4a7e +size 113308931 diff --git a/4b284b6bc4seed3/global_step80108/layer_29-model_01-model_states.pt b/4b284b6bc4seed3/global_step80108/layer_29-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..625661a6424101ca3c2a2b27ff7634e4606163e7 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/layer_29-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b384e618c871fb15e980f1278690d33ad6693782a72c82e347d0d2e02ed8b780 +size 113308931 diff --git a/4b284b6bc4seed3/global_step80108/layer_30-model_00-model_states.pt b/4b284b6bc4seed3/global_step80108/layer_30-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d59bcef86a767252e1ea54313a44a2aab8f95826 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/layer_30-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0404a638deffb8740a2fa4104d8605c4bd7a50afdbf15dbd8405ed6c6b8e5885 +size 113308931 diff --git a/4b284b6bc4seed3/global_step80108/layer_30-model_01-model_states.pt b/4b284b6bc4seed3/global_step80108/layer_30-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c98367db087bb88870c10ae124dde5e7c40554a8 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/layer_30-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b1e55f89153d504c6c3d45d556c0c85796a1115d11d289f987f1b1ac5b2b55ec +size 113308931 diff --git a/4b284b6bc4seed3/global_step80108/layer_31-model_00-model_states.pt b/4b284b6bc4seed3/global_step80108/layer_31-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3c7b03dacc7ca9d9f7832da7b4dda9fd561714f9 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/layer_31-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4922ec7c8f5ace2de82a2e1dbf850ded5457cc8c646b4ce9fe79425427b2f7a0 +size 113308931 diff --git a/4b284b6bc4seed3/global_step80108/layer_31-model_01-model_states.pt b/4b284b6bc4seed3/global_step80108/layer_31-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..704b0613e69dcc2e8cc23edf5baf8e63ee0f8417 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/layer_31-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2a147039b31f4ef6ed11c6415b3ba95e9b99cdd27e540b95c129805d331ee616 +size 113308931 diff --git a/4b284b6bc4seed3/global_step80108/layer_32-model_00-model_states.pt b/4b284b6bc4seed3/global_step80108/layer_32-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2f611b719b2eea269451393a5b81b69f876aebcd --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/layer_32-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0c8e1c6248e3450d619938fbbf270cdbfd4fc14874ed2129a3b0fea50658050d +size 113308931 diff --git a/4b284b6bc4seed3/global_step80108/layer_32-model_01-model_states.pt b/4b284b6bc4seed3/global_step80108/layer_32-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..400983846163a9ee96858ba93ff467edc802d7a3 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/layer_32-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4ffd6afad37742ee42067a88791c81de0ba7dc1a3d9a6525ed0c564d93bfa4ce +size 113308931 diff --git a/4b284b6bc4seed3/global_step80108/layer_33-model_00-model_states.pt b/4b284b6bc4seed3/global_step80108/layer_33-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3150d8cd0344209ad110c90bb3eb4944450dde31 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/layer_33-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:54d9e519fba5c8a01263ccfd4ca7105c43abad791ac7ee686f08be39f3da921a +size 113308931 diff --git a/4b284b6bc4seed3/global_step80108/layer_33-model_01-model_states.pt b/4b284b6bc4seed3/global_step80108/layer_33-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..528fa633b0eca5711ef5ba80931c74c26efeb660 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/layer_33-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:50412381057e1f3aaeff0edbc47bed0b75b82593afc1c8ef63426db893b14a87 +size 113308931 diff --git a/4b284b6bc4seed3/global_step80108/layer_34-model_00-model_states.pt b/4b284b6bc4seed3/global_step80108/layer_34-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ac071f7fb34e3c61767e0e7e044e313e2bcfd60c --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/layer_34-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ad84e826955cabd6ca1adfbe3764fc4b81995322e94a536f10a032145d28db8b +size 113308931 diff --git a/4b284b6bc4seed3/global_step80108/layer_34-model_01-model_states.pt b/4b284b6bc4seed3/global_step80108/layer_34-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d7eea1741f772e6c518033e2660de74f503494e9 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/layer_34-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2a5fea2c6b0c5d8edf90d308718507496d9cea9475b5ff0e99daea4b17e1ed44 +size 113308931 diff --git a/4b284b6bc4seed3/global_step80108/layer_35-model_00-model_states.pt b/4b284b6bc4seed3/global_step80108/layer_35-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f61f2513cfea08c0d0b62e442e05709f6762d860 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/layer_35-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6f4c065ca8b4a3c092a4c63b06d0670849e79cabe3315c8f5d7c51cee4f1d4c8 +size 113308931 diff --git a/4b284b6bc4seed3/global_step80108/layer_35-model_01-model_states.pt b/4b284b6bc4seed3/global_step80108/layer_35-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1dce8596b731131dded09d727577079df3db1b5a --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/layer_35-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b8333ea37f994594638fd511dea149f5a7704ac27beb5c6f081206d082c2e99d +size 113308931 diff --git a/4b284b6bc4seed3/global_step80108/layer_36-model_00-model_states.pt b/4b284b6bc4seed3/global_step80108/layer_36-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cb4198ed04268db2958f72dc0247ba5b36300da0 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/layer_36-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d42742831e4636e064355cc1d2c50a4724decba97e811983a6e1255a11be2fde +size 113308931 diff --git a/4b284b6bc4seed3/global_step80108/layer_36-model_01-model_states.pt b/4b284b6bc4seed3/global_step80108/layer_36-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c21f8d84c6d71b171de560872e34f3da493a11a8 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/layer_36-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:71b3a68993aadda8b45ddd7316a985f7057c400de4c1381789f13c625ea75fb4 +size 113308931 diff --git a/4b284b6bc4seed3/global_step80108/layer_37-model_00-model_states.pt b/4b284b6bc4seed3/global_step80108/layer_37-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..56254d2f36f78fb4545e81c5b89e4535b5afe346 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/layer_37-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:774f5fa9c2cee1fd9d7fd640f62f9928f8eca3c2ca0d0fe1030b84eaeaa80896 +size 113308931 diff --git a/4b284b6bc4seed3/global_step80108/layer_37-model_01-model_states.pt b/4b284b6bc4seed3/global_step80108/layer_37-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6cf6c82ab97f9fd8e6df184c92fba18038549454 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/layer_37-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:66567c1a4ac178cef4177500fbf6fc0ade4fcb0aaefeb8cf593a51929b179029 +size 113308931 diff --git a/4b284b6bc4seed3/global_step80108/layer_38-model_00-model_states.pt b/4b284b6bc4seed3/global_step80108/layer_38-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..547babd8a081e8cf9323c871edb4f762fe1da95b --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/layer_38-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0d5e6bc4450bb73cc66cf1b6cd88ba131b3e54c15ee4d08c63d7982acb657a2c +size 113308931 diff --git a/4b284b6bc4seed3/global_step80108/layer_38-model_01-model_states.pt b/4b284b6bc4seed3/global_step80108/layer_38-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1eb6327eff5d9b612cf78fee030d434441e9ae29 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/layer_38-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ff4c999da03192805313cbaf161e014e3a146f3df6eabb82eca29d2c1a54839e +size 113308931 diff --git a/4b284b6bc4seed3/global_step80108/layer_40-model_00-model_states.pt b/4b284b6bc4seed3/global_step80108/layer_40-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..233378080a4835652bd97dd9966fe8ac7e898340 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/layer_40-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:492cd132ab96de685f1980aec42278db4ed9b43482d5d1fc25430dd5902ee9b7 +size 13507 diff --git a/4b284b6bc4seed3/global_step80108/layer_40-model_01-model_states.pt b/4b284b6bc4seed3/global_step80108/layer_40-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..061a1814f83ed16d4481faaa460db18820641ba5 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/layer_40-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:474c8581c45b2b84df9d9d94a2dbc4db06fbbaa911f094067addfbc331cc4f2a +size 13507 diff --git a/4b284b6bc4seed3/global_step80108/mp_rank_00_model_states.pt b/4b284b6bc4seed3/global_step80108/mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f4f45daf9105a7d21c48c61c802c6bd34792d594 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0d9cba1e093f5ad96d7feb1caa9394817dc48794d04af4bf8268baf6f95454cb +size 51443 diff --git a/4b284b6bc4seed3/global_step80108/mp_rank_01_model_states.pt b/4b284b6bc4seed3/global_step80108/mp_rank_01_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..437ac20203e28143dd9bc2b0087195953e516265 --- /dev/null +++ b/4b284b6bc4seed3/global_step80108/mp_rank_01_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd6825d6396006274c134fd8e118d161ddd65e8527d32156460bdbdd35715fbf +size 51443 diff --git a/4b284b6bc4seed3/transformers/config.json b/4b284b6bc4seed3/transformers/config.json new file mode 100644 index 0000000000000000000000000000000000000000..df814c3a71ee49044410636b5eeb4f43611690ba --- /dev/null +++ b/4b284b6bc4seed3/transformers/config.json @@ -0,0 +1 @@ +{"vocab_size": 50432, "n_positions": 2048, "n_embd": 3072, "n_layer": 36, "n_head": 24, "n_inner": 12288, "activation_function": "gelu", "resid_pdrop": 0.1, "embd_pdrop": 0.1, "attn_pdrop": 0.1, "layer_norm_epsilon": 1e-05, "initializer_range": 0.02, "summary_type": "cls_index", "summary_use_proj": true, "summary_activation": null, "summary_first_dropout": 0.1, "summary_proj_to_labels": true, "scale_attn_weights": true, "use_cache": true, "scale_attn_by_inverse_layer_idx": false, "reorder_and_upcast_attn": false, "bos_token_id": 50256, "eos_token_id": 50256, "return_dict": true, "output_hidden_states": false, "output_attentions": false, "torchscript": false, "torch_dtype": null, "use_bfloat16": false, "tf_legacy_loss": false, "pruned_heads": {}, "tie_word_embeddings": true, "is_encoder_decoder": false, "is_decoder": false, "cross_attention_hidden_size": null, "add_cross_attention": false, "tie_encoder_decoder": false, "max_length": 20, "min_length": 0, "do_sample": false, "early_stopping": false, "num_beams": 1, "num_beam_groups": 1, "diversity_penalty": 0.0, "temperature": 1.0, "top_k": 50, "top_p": 1.0, "typical_p": 1.0, "repetition_penalty": 1.0, "length_penalty": 1.0, "no_repeat_ngram_size": 0, "encoder_no_repeat_ngram_size": 0, "bad_words_ids": null, "num_return_sequences": 1, "chunk_size_feed_forward": 0, "output_scores": false, "return_dict_in_generate": false, "forced_bos_token_id": null, "forced_eos_token_id": null, "remove_invalid_values": false, "exponential_decay_length_penalty": null, "suppress_tokens": null, "begin_suppress_tokens": null, "architectures": ["GPT2LMHeadModel"], "finetuning_task": null, "id2label": {"0": "LABEL_0", "1": "LABEL_1"}, "label2id": {"LABEL_0": 0, "LABEL_1": 1}, "tokenizer_class": null, "prefix": null, "pad_token_id": null, "sep_token_id": null, "decoder_start_token_id": null, "task_specific_params": null, "problem_type": null, "_name_or_path": "", "transformers_version": "4.25.0.dev0", "n_ctx": 1024, "gradient_checkpointing": false, "model_type": "gpt2"} \ No newline at end of file diff --git a/4b284b6bc4seed3/transformers/pytorch_model.bin b/4b284b6bc4seed3/transformers/pytorch_model.bin new file mode 100644 index 0000000000000000000000000000000000000000..4b2d0a2d9be1dd8231bb2e0823fd54e84179bbf0 --- /dev/null +++ b/4b284b6bc4seed3/transformers/pytorch_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:faf6c95c65240af0a5930f30cbf52bda8049937e8950285ffe94a09ed057e946 +size 8781203669 diff --git a/4b284b6bc4seed4/evaluation/generation/agg.4b284b6bc4seed4_GEM-web_nlg_en_PALM_prompt_0.json b/4b284b6bc4seed4/evaluation/generation/agg.4b284b6bc4seed4_GEM-web_nlg_en_PALM_prompt_0.json new file mode 100644 index 0000000000000000000000000000000000000000..b533eda88faf2d00015a02fc4646a939739f8af1 --- /dev/null +++ b/4b284b6bc4seed4/evaluation/generation/agg.4b284b6bc4seed4_GEM-web_nlg_en_PALM_prompt_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.35166211431807476, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.038071413053652275}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.06996455274792455, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0015592090868851113}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.3142067124043025, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0048759710824468425}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.1064177979826906, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002014407824130901}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.0322534557054686, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0009291159250523059}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.15163416252366027, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.003394361327422675}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.04977759217169638, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0012651503383739272}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.0665503328402659, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0014349991462073507}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.30272317644546903, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004757737332652531}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.10151875678161845, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0018675156066895481}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.06618311419871553, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0014716875527080561}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.29700852030137187, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004591273606148228}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.1005468816321386, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0018871768805081306}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b6bc4seed4/evaluation/generation/agg.4b284b6bc4seed4_GEM-web_nlg_en_PALM_prompt_1.json b/4b284b6bc4seed4/evaluation/generation/agg.4b284b6bc4seed4_GEM-web_nlg_en_PALM_prompt_1.json new file mode 100644 index 0000000000000000000000000000000000000000..beaf6e88f175d00569cd25fa4b9cee25cf4b1d7f --- /dev/null +++ b/4b284b6bc4seed4/evaluation/generation/agg.4b284b6bc4seed4_GEM-web_nlg_en_PALM_prompt_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.5073000336177755, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.05344474459205947}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.07583504538763819, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.001486787446354916}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.3716954850162639, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.005205035164096044}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.11830423680079659, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0020114505178455027}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.03495776879514267, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0009075777652215385}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.17885977259906066, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.003619881028179333}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.0546051702795999, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0012569436349181779}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.07030089422838176, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.001298347917395423}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.34696500909784356, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.00482360237080409}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.1099788832885831, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0017852180819479216}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.07122182052038024, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0013897967007664056}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.3477576171750515, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0047659276141866136}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.1110119989726, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0018755811955381053}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b6bc4seed4/evaluation/generation/agg.4b284b6bc4seed4_GEM-web_nlg_en_PALM_prompt_2.json b/4b284b6bc4seed4/evaluation/generation/agg.4b284b6bc4seed4_GEM-web_nlg_en_PALM_prompt_2.json new file mode 100644 index 0000000000000000000000000000000000000000..560c8e09b3ce99a7bdf9261e0135932b628ae0bc --- /dev/null +++ b/4b284b6bc4seed4/evaluation/generation/agg.4b284b6bc4seed4_GEM-web_nlg_en_PALM_prompt_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.5965263236594742, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.05163954961828016}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.07783318626900966, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0014071193338354882}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.39287654613370876, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.005155876341027884}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.12233537069614382, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0019128091926460928}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.0354373968856108, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0008545023435501012}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.19039459495393043, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.003663120720639406}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.05592276690064219, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.001197562574066807}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.07188967304527148, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0012421548275795777}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.3648630199526146, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004750553642386819}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.11320053656812012, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.001703639135984389}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.07268380811649039, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0012997045865083563}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.36691870218506767, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004689100059731652}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.1142026340807714, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0017614419186672153}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b6bc4seed4/evaluation/generation/agg.4b284b6bc4seed4_GEM-web_nlg_en_PALM_prompt_3.json b/4b284b6bc4seed4/evaluation/generation/agg.4b284b6bc4seed4_GEM-web_nlg_en_PALM_prompt_3.json new file mode 100644 index 0000000000000000000000000000000000000000..87ec8bf46d378b237c61d5f82d721c4ea69badfa --- /dev/null +++ b/4b284b6bc4seed4/evaluation/generation/agg.4b284b6bc4seed4_GEM-web_nlg_en_PALM_prompt_3.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.6590445507565462, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.03731228606768085}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.07980698513957299, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.00144116669925528}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.40871250304941253, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.005277184107543118}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.1255592398663772, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0018984572804718245}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.036737647094888005, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0009490563555727562}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.2012500620682874, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.003837876814963123}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.05799188686736059, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0012470877418224642}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.07344239380035893, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.001301053396600686}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.37652823939289803, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0048219321223642725}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.11563164980687576, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0017088580020787614}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.07446732582003722, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0013512166475080024}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.37983284753458935, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004768406523815667}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.1170142277810441, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0017619775635762797}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 3, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b6bc4seed4/evaluation/generation/agg.4b284b6bc4seed4_GEM-web_nlg_en_PALM_prompt_4.json b/4b284b6bc4seed4/evaluation/generation/agg.4b284b6bc4seed4_GEM-web_nlg_en_PALM_prompt_4.json new file mode 100644 index 0000000000000000000000000000000000000000..da227b3da1ddf510bf857b9c9aa44ae62acd48c9 --- /dev/null +++ b/4b284b6bc4seed4/evaluation/generation/agg.4b284b6bc4seed4_GEM-web_nlg_en_PALM_prompt_4.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.6612094103636722, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.05316688615822092}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.0814867015244332, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.00140335178133597}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.41970698412830326, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.005264636607062869}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.12810389443498593, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0018474124639315977}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.03716974645311799, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.000858671949423613}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.20569650614003127, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0037797450322498744}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.05856459210667893, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0011483796934916865}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.07414197510231946, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0012218676591713073}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.3844479540779492, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004824012642018971}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.11674639728784307, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0016142840608080332}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.07570666678042967, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0013105985925116346}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.3891045320252018, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004752985303492144}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.11883717065008154, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0017051707976467297}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 4, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b6bc4seed4/evaluation/generation/agg.4b284b6bc4seed4_GEM-web_nlg_en_PALM_prompt_5.json b/4b284b6bc4seed4/evaluation/generation/agg.4b284b6bc4seed4_GEM-web_nlg_en_PALM_prompt_5.json new file mode 100644 index 0000000000000000000000000000000000000000..d41f685273a3823eb69134ebb67239c35ec628df --- /dev/null +++ b/4b284b6bc4seed4/evaluation/generation/agg.4b284b6bc4seed4_GEM-web_nlg_en_PALM_prompt_5.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "bleu": 0.7275241684724033, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.025139024300557544}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_precision": 0.08119001231813255, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0014308370032712263}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_recall": 0.42544190008314364, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.005347650585072293}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge1_fmeasure": 0.12807283189555618, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0018561044445990925}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_precision": 0.037488476057553025, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0009127843819336664}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_recall": 0.21034382299607524, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0038365434728806005}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rouge2_fmeasure": 0.05924660282751187, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0011837956870791252}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_precision": 0.07373330048793485, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0012777957450006742}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_recall": 0.38841487576118355, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.004859412970167045}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeL_fmeasure": 0.1163811957107418, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0016389675453477302}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_precision": 0.07528625093598806, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0013390502316204457}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_recall": 0.39421410712837596, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.004856189403160334}, {"task_name": "GEM/web_nlg_en", "prompt_name": "PALM_prompt", "rougeLsum_fmeasure": 0.11860693664537329, "fixed_answer_choice_list": null, "dataset_path": "GEM/web_nlg", "dataset_name": "en", "subset": null, "prompt_id": "3e41305c-5461-4cf3-853d-8a6fb5747623", "prompt_jinja": "I will verbalize an abstract representation of a sentence in natural language. To do so, I will first show the representation and then the natural language. The text needs to include all of the information in the representation.\n\n{{input | join(\", \")}} {% for i in references %}\n ||| {{ i }} \n{% endfor %}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0017120447774363115}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 5, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b6bc4seed4/evaluation/generation/agg.4b284b6bc4seed4_GEM-wiki_lingua_en_tldr_en_0.json b/4b284b6bc4seed4/evaluation/generation/agg.4b284b6bc4seed4_GEM-wiki_lingua_en_tldr_en_0.json new file mode 100644 index 0000000000000000000000000000000000000000..42e169dcfd93a37dfba3097b5557ea9e245cb5c2 --- /dev/null +++ b/4b284b6bc4seed4/evaluation/generation/agg.4b284b6bc4seed4_GEM-wiki_lingua_en_tldr_en_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.15946778937891515, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0019263515035577486}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.2715850357160657, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0027017071210897574}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.18622713587913528, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0018412460647723918}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.03438888805377945, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0008080459258315309}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.06117675765752758, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0015061198705940962}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.040460580826441606, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0008960319674160765}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.12211228339854341, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0013298965520439228}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.21625650856608786, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0022314529211675395}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.14446880136361956, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0013159464984661877}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.1467045219684518, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0017626659229341545}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.25116019588094557, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0025177140997767675}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.1716160186471173, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0016894452306051078}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 1.8709275972877584, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.058898637546592025}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b6bc4seed4/evaluation/generation/agg.4b284b6bc4seed4_GEM-wiki_lingua_en_tldr_en_1.json b/4b284b6bc4seed4/evaluation/generation/agg.4b284b6bc4seed4_GEM-wiki_lingua_en_tldr_en_1.json new file mode 100644 index 0000000000000000000000000000000000000000..122e09bea227bfdeea37825c6a9aa8d5a54aedfe --- /dev/null +++ b/4b284b6bc4seed4/evaluation/generation/agg.4b284b6bc4seed4_GEM-wiki_lingua_en_tldr_en_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.17861978084436733, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0021557050699636633}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.29492911982793857, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0027364010294303274}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.2051454909041775, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.001963503184239578}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.04216196051123768, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0009857371725593724}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.06892249984818269, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0015097658330848196}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.047516585339244355, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0009726713638331002}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.1277101470262864, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0014839765534000772}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.21755280146548553, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0021188768570991334}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.14783021982665137, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.00133667062385201}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.16764488030279848, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.002021292385911164}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.2778932641853077, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0025900462140142086}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.1927127973435724, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0018361383918979964}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 2.3540646113466352, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.058383312223254456}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b6bc4seed4/evaluation/generation/agg.4b284b6bc4seed4_GEM-wiki_lingua_en_tldr_en_2.json b/4b284b6bc4seed4/evaluation/generation/agg.4b284b6bc4seed4_GEM-wiki_lingua_en_tldr_en_2.json new file mode 100644 index 0000000000000000000000000000000000000000..83c720d3dc7443fad671316195f725c5b7024eda --- /dev/null +++ b/4b284b6bc4seed4/evaluation/generation/agg.4b284b6bc4seed4_GEM-wiki_lingua_en_tldr_en_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.1867354040241945, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0021764534616989487}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.307356685382873, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.002668787558898061}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.2125892107712728, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0018726113691632032}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.044945343265659306, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0010090897572849198}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.07429122479757874, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0015703671923323263}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.05037415373416898, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0009688792622757568}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.13207273293373048, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0015334022424691339}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.22372031586233712, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002107048468174928}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.15111305737547598, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0012722677867412764}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.1758960740764525, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0020592289423643946}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.2900411283233057, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0025253027294766133}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.20022450371280426, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0017542714847597852}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 2.5117616289013234, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.07882958513520422}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b6bc4seed4/evaluation/generation/agg.4b284b6bc4seed4_GEM-wiki_lingua_en_tldr_en_3.json b/4b284b6bc4seed4/evaluation/generation/agg.4b284b6bc4seed4_GEM-wiki_lingua_en_tldr_en_3.json new file mode 100644 index 0000000000000000000000000000000000000000..a652edff92b0568348dcd74a216ed31f6ca782e6 --- /dev/null +++ b/4b284b6bc4seed4/evaluation/generation/agg.4b284b6bc4seed4_GEM-wiki_lingua_en_tldr_en_3.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.1591881844404937, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0024467695339504187}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.25516734786727036, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0032356801874518703}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.17575906704306832, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002174949765654744}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.03784379091188361, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.001089131871792838}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.0624780077769272, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0016087440931355302}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.0413255105224322, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.000931832765467482}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.11442394801240031, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0018112801572746817}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.18773348293405673, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002527108820020842}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.12628359782789042, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0015182895930992903}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.14968568215454517, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.002308127867301231}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.2408810647537952, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0030822171919214422}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.16530823720647217, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0020367190470455404}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 2.403113898933743, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.053251073858493}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 3, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b6bc4seed4/evaluation/generation/agg.4b284b6bc4seed4_GEM-wiki_lingua_en_tldr_en_4.json b/4b284b6bc4seed4/evaluation/generation/agg.4b284b6bc4seed4_GEM-wiki_lingua_en_tldr_en_4.json new file mode 100644 index 0000000000000000000000000000000000000000..023e10d7815e986f14017903817ed20cea941faf --- /dev/null +++ b/4b284b6bc4seed4/evaluation/generation/agg.4b284b6bc4seed4_GEM-wiki_lingua_en_tldr_en_4.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.052405749034228705, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0020110499867171685}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.08478707705138788, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0028865777805548412}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.0557867591334426, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.00186394804170534}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.011080419003140766, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0006523070791806857}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.01999068467854864, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.001096551185475821}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.012185104729686681, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0005907016058266906}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.03862877667774788, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0014997122070137985}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.0641687643508006, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002226474813987104}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.04111644120483341, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0013476527639030426}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.04914657123032221, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0018810939013272998}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.07980206255787106, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0027207315430338498}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.052305917688342855, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0017400550554708667}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 0.472345677088637, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.040900356286228075}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 4, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b6bc4seed4/evaluation/generation/agg.4b284b6bc4seed4_GEM-wiki_lingua_en_tldr_en_5.json b/4b284b6bc4seed4/evaluation/generation/agg.4b284b6bc4seed4_GEM-wiki_lingua_en_tldr_en_5.json new file mode 100644 index 0000000000000000000000000000000000000000..3ef33935f5d9341c7bf62d740f4e50ba8fda195b --- /dev/null +++ b/4b284b6bc4seed4/evaluation/generation/agg.4b284b6bc4seed4_GEM-wiki_lingua_en_tldr_en_5.json @@ -0,0 +1 @@ +{"results": [{"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_precision": 0.008509363653553257, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.000845658818252671}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_recall": 0.01382276652509776, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0013334225811003739}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge1_fmeasure": 0.00898341548277317, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0008281424457556686}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_precision": 0.0019932915366697277, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0002440516250439588}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_recall": 0.004040972091745142, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0006014270152725088}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rouge2_fmeasure": 0.002227060333018499, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0002638537239607946}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_precision": 0.006364757119046798, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0006395473026447492}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_recall": 0.010409531448448452, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0010327387282074423}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeL_fmeasure": 0.006634289847575651, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0006061194677904214}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_precision": 0.00802904222397337, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0007953313177037809}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_recall": 0.013136908473646484, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0012773726821035238}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "rougeLsum_fmeasure": 0.008483394098012836, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0007802466552819305}, {"task_name": "GEM/wiki_lingua_en", "prompt_name": "tldr_en", "bleu": 6.538062149513937e-07, "fixed_answer_choice_list": null, "dataset_path": "GEM/wiki_lingua", "dataset_name": "en", "subset": null, "prompt_id": "d3c5baa3-5e37-46f8-b1b2-5b834181c9da", "prompt_jinja": "{{source}}\n\nTL;DR in English: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 1.1494813563989744e-06}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 5, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b6bc4seed4/evaluation/generation/agg.4b284b6bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_0.json b/4b284b6bc4seed4/evaluation/generation/agg.4b284b6bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_0.json new file mode 100644 index 0000000000000000000000000000000000000000..081b003688307e06132703679ba8bf05a54c55f7 --- /dev/null +++ b/4b284b6bc4seed4/evaluation/generation/agg.4b284b6bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 0.20344702036475212, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.020813423545746928}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.02031066874429793, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0010982973394100017}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.0339006777431073, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0010754582360608094}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.02272612382623739, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.000657613160095564}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.004428962002328776, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0010133668145643837}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.0032484488515415436, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.00039041664574734875}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.0021610970637232323, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.00025014704785064965}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.02023890948503867, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.001094108815755343}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.03378068019453833, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0010619663136781138}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.022638837838076648, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.000646894021986954}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.019207655955704183, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0010760427436256133}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.03164987205173273, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0009558614487519096}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.021275240072120734, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0005850724780177193}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b6bc4seed4/evaluation/generation/agg.4b284b6bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_1.json b/4b284b6bc4seed4/evaluation/generation/agg.4b284b6bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_1.json new file mode 100644 index 0000000000000000000000000000000000000000..25fb989c0c4b84ffd8ab051e513247b5045c56cc --- /dev/null +++ b/4b284b6bc4seed4/evaluation/generation/agg.4b284b6bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 6.931679880377635, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.12521222343600627}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.34003150968688334, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.003075339331446666}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.45015732570626815, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0028997064403193467}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.35867604679541404, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0022242609651642654}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.14759589015368266, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.002060777542304401}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.1951244486489613, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0020953412261598093}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.15367455208735437, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0016232409779530833}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.25480483800873843, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0023341935238719103}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.3465181251792575, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0024646626498150185}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.2708573841017006, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0016414160973280045}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.2799685955963331, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0028032299642029843}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.3677356916274029, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0026996771832412166}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.29387614768355197, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0021153745644870423}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b6bc4seed4/evaluation/generation/agg.4b284b6bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_2.json b/4b284b6bc4seed4/evaluation/generation/agg.4b284b6bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_2.json new file mode 100644 index 0000000000000000000000000000000000000000..55213dcdf62fae70e0aa71f365a3e87d12dc570b --- /dev/null +++ b/4b284b6bc4seed4/evaluation/generation/agg.4b284b6bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 7.657232828965316, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.12471874140369284}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.35675768591806567, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0031022663155459203}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.46937017367708633, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.00275346130622528}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.3776586411733957, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002198646985806164}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.16231756057946886, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0020395417907086693}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.2138289664047894, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0020707270316515283}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.17010386224275442, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0016283471019571314}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.26310458036396617, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.002272981131996748}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.35664473399252883, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0023940807408273975}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.28123834488197835, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0016069446891559397}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.2914642398591572, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.002757164859310039}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.3829945698750505, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0026117917187163785}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.30825756247609604, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0020874241622850045}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b6bc4seed4/evaluation/generation/agg.4b284b6bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_3.json b/4b284b6bc4seed4/evaluation/generation/agg.4b284b6bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_3.json new file mode 100644 index 0000000000000000000000000000000000000000..cdf95f7c2c8e212cb59dc92b22b08eae4787e01e --- /dev/null +++ b/4b284b6bc4seed4/evaluation/generation/agg.4b284b6bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_3.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 8.442104172996691, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.1225265310989897}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.37510123434341147, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0029659588823890727}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.47688116434271155, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.002779761613350503}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.39418201029816835, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0021766899975066423}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.1722185872161438, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.001982108880961337}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.22148343783169197, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0021298024706319753}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.18042060590724515, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0016663829828460059}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.2708367244008351, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.002174690044000994}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.35404771153503223, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002443187318628693}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.2871477669735601, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0016369768534961649}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.30935204172558023, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0026977427492078823}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.3923447311858455, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0026716176658316635}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.3246521112217336, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.002119544362824107}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 3, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b6bc4seed4/evaluation/generation/agg.4b284b6bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_4.json b/4b284b6bc4seed4/evaluation/generation/agg.4b284b6bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_4.json new file mode 100644 index 0000000000000000000000000000000000000000..05f1f04d2204829ecc0548ec99e257c6db2a228f --- /dev/null +++ b/4b284b6bc4seed4/evaluation/generation/agg.4b284b6bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_4.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 9.264771481612339, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.14797632752636197}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.3925987211674676, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0026976461573692354}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.47354063069748037, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0026338292343196816}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.4086207638030011, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0020852610120524026}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.1796234616071412, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0018685574967649593}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.2190905542412407, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.002068607728271308}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.18703841259223752, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0016890429531878357}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.2819581010790434, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.002044363363394681}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.346344258787895, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0023161012828013965}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.29515772076134655, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0016661150684501613}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.32521791939739797, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0025320061675288244}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.3913010253854303, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0025849947764755407}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.3382507422373424, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0021124639320887124}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 4, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b6bc4seed4/evaluation/generation/agg.4b284b6bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_5.json b/4b284b6bc4seed4/evaluation/generation/agg.4b284b6bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_5.json new file mode 100644 index 0000000000000000000000000000000000000000..e689fc4bd3d18c770b2aa42344f8a332e9bfe6b4 --- /dev/null +++ b/4b284b6bc4seed4/evaluation/generation/agg.4b284b6bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_5.json @@ -0,0 +1 @@ +{"results": [{"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "bleu": 9.958980611111656, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.14855771135694565}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_precision": 0.4061514037393209, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0025821552864821757}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_recall": 0.47804480569363766, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.002643357770719704}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge1_fmeasure": 0.4197228631027415, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0020063425382385058}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_precision": 0.18757831560333757, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.001891660346486441}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_recall": 0.2218502429628836, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0020386307840161645}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rouge2_fmeasure": 0.1931509426359425, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.001665707134510459}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_precision": 0.2911232268001962, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0020806579815607195}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_recall": 0.3466822060660839, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.002329148139407088}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeL_fmeasure": 0.3017298916186032, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0017018141577312348}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_precision": 0.33992936633595283, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0024759755832926282}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_recall": 0.39927240691403565, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0025795756365194628}, {"task_name": "e2e_nlg_cleaned", "prompt_name": "generate_text_restaurant", "rougeLsum_fmeasure": 0.35086688827184365, "fixed_answer_choice_list": null, "dataset_path": "e2e_nlg_cleaned", "dataset_name": null, "subset": null, "prompt_id": "1acabbc3-c9b9-4624-a684-29faeccff46f", "prompt_jinja": "Given the following data about a restaurant:\n{% for feature in meaning_representation.split(\"]\") %} {% set key = feature.split(\"[\")[0].replace(\",\",\"\") %} {% set value = feature.replace(\",\",\"\").replace(key+\"[\", '''') %}\n{% if value != \"\" %} {{key}} : {{value}} {% endif %}\n{%- endfor %}\nGenerate some text about this restaurant. ||| {{human_reference}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0020482132353444454}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 5, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b6bc4seed4/evaluation/generation/agg.4b284b6bc4seed4_gem_xsum_article_DOC_summary_0.json b/4b284b6bc4seed4/evaluation/generation/agg.4b284b6bc4seed4_gem_xsum_article_DOC_summary_0.json new file mode 100644 index 0000000000000000000000000000000000000000..3329e2531c211574bd0560ccd4a84eaf653c289d --- /dev/null +++ b/4b284b6bc4seed4/evaluation/generation/agg.4b284b6bc4seed4_gem_xsum_article_DOC_summary_0.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.14717191874948962, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.002039989999763031}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.34130886710278735, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004109809014072106}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.20091233893732696, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002460990636185999}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.031180276988501406, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0011515924925153934}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.0750546362679565, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.002664189585730598}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.04296352475719179, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0015091336137169667}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.11187209453346593, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0015620035707168242}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.26167076851220833, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0032523973074039445}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.15294193870162445, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0018589320642533784}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.11548986592851035, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0016848405957502828}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.27023318122685785, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0035574900499767722}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.15798602735496012, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0020505297987330412}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 1.7847107445080181, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.12259281036544756}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 0, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b6bc4seed4/evaluation/generation/agg.4b284b6bc4seed4_gem_xsum_article_DOC_summary_1.json b/4b284b6bc4seed4/evaluation/generation/agg.4b284b6bc4seed4_gem_xsum_article_DOC_summary_1.json new file mode 100644 index 0000000000000000000000000000000000000000..5429336a2c5437d19e73e83024eb734af77476ad --- /dev/null +++ b/4b284b6bc4seed4/evaluation/generation/agg.4b284b6bc4seed4_gem_xsum_article_DOC_summary_1.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.12097137240313847, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0017496349490089252}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.2990148200796171, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.003991241961142267}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.17024912689462188, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0023476916428796877}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.021525610014554653, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0009005470188155159}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.055447375013310755, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.002401181861336932}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.030605161726994057, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0012798169612394362}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.09373642633960022, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.001306812474264428}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.23409871583030145, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0031894294773192737}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.13223813090153158, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0017763582648502928}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.0978239478590475, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0014318544124746646}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.24391576493442443, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0034515787165719444}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.13796987863879345, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0019475228863655185}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 1.1845032944798495, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.08458246586222135}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 1, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b6bc4seed4/evaluation/generation/agg.4b284b6bc4seed4_gem_xsum_article_DOC_summary_2.json b/4b284b6bc4seed4/evaluation/generation/agg.4b284b6bc4seed4_gem_xsum_article_DOC_summary_2.json new file mode 100644 index 0000000000000000000000000000000000000000..c0a2062996e25e28284b756f96edea10a67f7a1a --- /dev/null +++ b/4b284b6bc4seed4/evaluation/generation/agg.4b284b6bc4seed4_gem_xsum_article_DOC_summary_2.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.12153696089604207, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.0017564783405385376}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.30200065000392107, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.004133147911453231}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.17123176762196604, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002367991688636443}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.022397648703525567, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0008966352941752963}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.05865756100278522, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.002417706489905652}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.03194665621464301, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0012704379487708378}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.09454924200528139, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0013285980685601034}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.23705948565261042, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0033238074174046623}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.13347870518175978, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.001810460575841908}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.09773827044948902, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0014279562335011396}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.24540888083433957, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0035863376843111756}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.13805797792168725, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0019538992181766693}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 1.235087762721956, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.12954971142620794}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 2, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b6bc4seed4/evaluation/generation/agg.4b284b6bc4seed4_gem_xsum_article_DOC_summary_3.json b/4b284b6bc4seed4/evaluation/generation/agg.4b284b6bc4seed4_gem_xsum_article_DOC_summary_3.json new file mode 100644 index 0000000000000000000000000000000000000000..057e59934e68e8d1f6baafa9e94c78275803010e --- /dev/null +++ b/4b284b6bc4seed4/evaluation/generation/agg.4b284b6bc4seed4_gem_xsum_article_DOC_summary_3.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.11912123096636808, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.001985064027306789}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.284241972897382, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.00429277701738966}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.1640154958358604, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0025105121490214565}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.022035764094734074, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0009495941851705396}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.05485929060591564, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0023528230640158182}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.03073680556060331, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0012970855907124138}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.09256740744943301, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0014688063331016958}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.2237667779749703, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0033868663103060566}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.12797306233278474, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0018874238035470816}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.09452589861322153, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0015705338179864972}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.22814994714493522, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0036128044767980974}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.13064448950535576, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0020334528859491884}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 1.2530842896627028, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.1292510298416823}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 3, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b6bc4seed4/evaluation/generation/agg.4b284b6bc4seed4_gem_xsum_article_DOC_summary_4.json b/4b284b6bc4seed4/evaluation/generation/agg.4b284b6bc4seed4_gem_xsum_article_DOC_summary_4.json new file mode 100644 index 0000000000000000000000000000000000000000..97dd360ecbccd8f9ecbdfdc24dd67ffaebb9583a --- /dev/null +++ b/4b284b6bc4seed4/evaluation/generation/agg.4b284b6bc4seed4_gem_xsum_article_DOC_summary_4.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.036060956179475516, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.002146455590056505}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.0690610482890532, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.003982103092460407}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.04359155004979404, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.002446009970548131}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.00544898809262409, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.0005451635252349526}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.012376718286934233, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.001258378038487793}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.007201974037466402, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0006993387361055898}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.02859153283892875, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.0017520581139644556}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.0540675976921445, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0031205628190529014}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.034064899256478404, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0019036508052699063}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.02946392180089849, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0018091240355730465}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.05579499878286511, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.0032320807958250114}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.035141373500357204, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.0019687859509567853}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 0.5139598974348316, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 0.11912575032590099}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 4, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b6bc4seed4/evaluation/generation/agg.4b284b6bc4seed4_gem_xsum_article_DOC_summary_5.json b/4b284b6bc4seed4/evaluation/generation/agg.4b284b6bc4seed4_gem_xsum_article_DOC_summary_5.json new file mode 100644 index 0000000000000000000000000000000000000000..53eff017bec901db766fff4f05ee561431dedd18 --- /dev/null +++ b/4b284b6bc4seed4/evaluation/generation/agg.4b284b6bc4seed4_gem_xsum_article_DOC_summary_5.json @@ -0,0 +1 @@ +{"results": [{"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_precision": 0.00304016734736987, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_precision_stderr": 0.000888339058787168}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_recall": 0.002441151228222129, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_recall_stderr": 0.0006688844091459975}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge1_fmeasure": 0.0026631982951325368, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge1_fmeasure_stderr": 0.0007488447516617362}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_precision": 0.0005433276798426632, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_precision_stderr": 0.00039244433049951473}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_recall": 0.00033315740862910673, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_recall_stderr": 0.0002365408622759455}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rouge2_fmeasure": 0.00041201488569909625, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rouge2_fmeasure_stderr": 0.0002949309636685756}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_precision": 0.002191679085043183, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_precision_stderr": 0.000685805567529641}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_recall": 0.0017718084851004953, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_recall_stderr": 0.0005070173978560121}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeL_fmeasure": 0.0019214818091001502, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeL_fmeasure_stderr": 0.0005698678616813168}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_precision": 0.002284463934531111, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_precision_stderr": 0.0007267983753519665}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_recall": 0.0018384573787288605, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_recall_stderr": 0.000531115868075893}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "rougeLsum_fmeasure": 0.001998668773079567, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "rougeLsum_fmeasure_stderr": 0.000600651825136055}, {"task_name": "gem_xsum", "prompt_name": "article_DOC_summary", "bleu": 1.5223289746048162e-36, "fixed_answer_choice_list": null, "dataset_path": "GEM/xsum", "dataset_name": null, "subset": "", "prompt_id": "a8d4ecfa-c944-44d5-878c-04fd5db59e64", "prompt_jinja": "Article: {{document}}\n\nSummary: ||| {{target}}", "prompt_original_task": true, "comment": "", "bleu_stderr": 3.669632606867041e-32}], "config": {"model": "hf-causal", "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", "task_args": "", "num_fewshot": 5, "batch_size": 16, "device": "cuda", "use_cache": false, "limit": 3000, "bootstrap_iters": 10, "seed": 1234}} \ No newline at end of file diff --git a/4b284b6bc4seed4/evaluation/generation/examples.4b284b6bc4seed4_GEM-web_nlg_en_PALM_prompt_0.jsonl b/4b284b6bc4seed4/evaluation/generation/examples.4b284b6bc4seed4_GEM-web_nlg_en_PALM_prompt_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..e47bc8fed939487d5e853a01cc08ba057cc5abea --- /dev/null +++ b/4b284b6bc4seed4/evaluation/generation/examples.4b284b6bc4seed4_GEM-web_nlg_en_PALM_prompt_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:00482a473bca594121cd0d50d940ce8f98c053443dc8c7d068e6c09be51941aa +size 4160610 diff --git a/4b284b6bc4seed4/evaluation/generation/examples.4b284b6bc4seed4_GEM-web_nlg_en_PALM_prompt_1.jsonl b/4b284b6bc4seed4/evaluation/generation/examples.4b284b6bc4seed4_GEM-web_nlg_en_PALM_prompt_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..2245f8768ce290de90cfd551db494f88cf86c6ac --- /dev/null +++ b/4b284b6bc4seed4/evaluation/generation/examples.4b284b6bc4seed4_GEM-web_nlg_en_PALM_prompt_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:224195a2f5c0dacc2ede1c393bebb4f3eee63f301a09933a007408328bd76b81 +size 5111698 diff --git a/4b284b6bc4seed4/evaluation/generation/examples.4b284b6bc4seed4_GEM-web_nlg_en_PALM_prompt_2.jsonl b/4b284b6bc4seed4/evaluation/generation/examples.4b284b6bc4seed4_GEM-web_nlg_en_PALM_prompt_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..59cb2eb99d914e39768438ff60f66aa0719770af --- /dev/null +++ b/4b284b6bc4seed4/evaluation/generation/examples.4b284b6bc4seed4_GEM-web_nlg_en_PALM_prompt_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6ff11b34d982cd52a50477dc1c6797a9942d66b083cd81363ea1fe5fb1ff501d +size 6008523 diff --git a/4b284b6bc4seed4/evaluation/generation/examples.4b284b6bc4seed4_GEM-web_nlg_en_PALM_prompt_3.jsonl b/4b284b6bc4seed4/evaluation/generation/examples.4b284b6bc4seed4_GEM-web_nlg_en_PALM_prompt_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..794b846425c0bf0effcf1faeecc2f360b5607772 --- /dev/null +++ b/4b284b6bc4seed4/evaluation/generation/examples.4b284b6bc4seed4_GEM-web_nlg_en_PALM_prompt_3.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:533dcd05160ae2d4c3fb6c72a96175f71cc857864bb7ae4d2614070dae0013f9 +size 6897287 diff --git a/4b284b6bc4seed4/evaluation/generation/examples.4b284b6bc4seed4_GEM-web_nlg_en_PALM_prompt_4.jsonl b/4b284b6bc4seed4/evaluation/generation/examples.4b284b6bc4seed4_GEM-web_nlg_en_PALM_prompt_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..44a9f38089fbd0ea0ea1d7d85c4ba5dfa2d9312a --- /dev/null +++ b/4b284b6bc4seed4/evaluation/generation/examples.4b284b6bc4seed4_GEM-web_nlg_en_PALM_prompt_4.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9c93af68e2c58f79b9bd3a64f233824228b68b3341fb22dd7faea96f7a4ffb1b +size 7806812 diff --git a/4b284b6bc4seed4/evaluation/generation/examples.4b284b6bc4seed4_GEM-web_nlg_en_PALM_prompt_5.jsonl b/4b284b6bc4seed4/evaluation/generation/examples.4b284b6bc4seed4_GEM-web_nlg_en_PALM_prompt_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..1afdd59736f1b961df9b0ee1ed8b6015153b25e7 --- /dev/null +++ b/4b284b6bc4seed4/evaluation/generation/examples.4b284b6bc4seed4_GEM-web_nlg_en_PALM_prompt_5.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8d7a9cc90fe3ae4f43e71058587aef00bf2ba5cc0c805faf3a9aa5e586d965ad +size 8712138 diff --git a/4b284b6bc4seed4/evaluation/generation/examples.4b284b6bc4seed4_GEM-wiki_lingua_en_tldr_en_0.jsonl b/4b284b6bc4seed4/evaluation/generation/examples.4b284b6bc4seed4_GEM-wiki_lingua_en_tldr_en_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..454fd78c081f1fcb44ca9b17b49b86ebd4183c97 --- /dev/null +++ b/4b284b6bc4seed4/evaluation/generation/examples.4b284b6bc4seed4_GEM-wiki_lingua_en_tldr_en_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7937268a7c4edd2cf777ebfac57b683289a4cb76e6d1541a36513978a24354ca +size 7692596 diff --git a/4b284b6bc4seed4/evaluation/generation/examples.4b284b6bc4seed4_GEM-wiki_lingua_en_tldr_en_1.jsonl b/4b284b6bc4seed4/evaluation/generation/examples.4b284b6bc4seed4_GEM-wiki_lingua_en_tldr_en_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..a4b50ab0d10bf0ba03e03da43a702617ddd9e43e --- /dev/null +++ b/4b284b6bc4seed4/evaluation/generation/examples.4b284b6bc4seed4_GEM-wiki_lingua_en_tldr_en_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f71bd250177497a432254e91a21d500785bbd74296299e31e71486f6d5b4ad4f +size 13300240 diff --git a/4b284b6bc4seed4/evaluation/generation/examples.4b284b6bc4seed4_GEM-wiki_lingua_en_tldr_en_2.jsonl b/4b284b6bc4seed4/evaluation/generation/examples.4b284b6bc4seed4_GEM-wiki_lingua_en_tldr_en_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..728d322ba1e16c65f27c52d552e6d825a0feb868 --- /dev/null +++ b/4b284b6bc4seed4/evaluation/generation/examples.4b284b6bc4seed4_GEM-wiki_lingua_en_tldr_en_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6c83e7bc8d7fb093c7f672787f1bb298318a36b76606be05e8e7076ac09a8702 +size 18906277 diff --git a/4b284b6bc4seed4/evaluation/generation/examples.4b284b6bc4seed4_GEM-wiki_lingua_en_tldr_en_3.jsonl b/4b284b6bc4seed4/evaluation/generation/examples.4b284b6bc4seed4_GEM-wiki_lingua_en_tldr_en_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..49c380d8af251a811a5cc12c2f97b756981b5fac --- /dev/null +++ b/4b284b6bc4seed4/evaluation/generation/examples.4b284b6bc4seed4_GEM-wiki_lingua_en_tldr_en_3.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cc5aa812ff71b969c5a35bba93333da2106f94b4f36fcfea5eddc37547967d36 +size 24334926 diff --git a/4b284b6bc4seed4/evaluation/generation/examples.4b284b6bc4seed4_GEM-wiki_lingua_en_tldr_en_4.jsonl b/4b284b6bc4seed4/evaluation/generation/examples.4b284b6bc4seed4_GEM-wiki_lingua_en_tldr_en_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..2c58bbea6ead8538b05635d194d49f2fdf8a3ccc --- /dev/null +++ b/4b284b6bc4seed4/evaluation/generation/examples.4b284b6bc4seed4_GEM-wiki_lingua_en_tldr_en_4.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:849407ce3ddec0cd2aa2b404d423d908636f4a439b8fec7d9178e1b4d367af8c +size 29475902 diff --git a/4b284b6bc4seed4/evaluation/generation/examples.4b284b6bc4seed4_GEM-wiki_lingua_en_tldr_en_5.jsonl b/4b284b6bc4seed4/evaluation/generation/examples.4b284b6bc4seed4_GEM-wiki_lingua_en_tldr_en_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..cdc5dedda6aa4bf12e5ba12f329d5169f37d6ac3 --- /dev/null +++ b/4b284b6bc4seed4/evaluation/generation/examples.4b284b6bc4seed4_GEM-wiki_lingua_en_tldr_en_5.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b0c1cddf9af3e174270db464e21e89cb535d001db32657bf3f8b597a0d6a2680 +size 34800652 diff --git a/4b284b6bc4seed4/evaluation/generation/examples.4b284b6bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl b/4b284b6bc4seed4/evaluation/generation/examples.4b284b6bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..dc9ddc85ae95dbc6d2ccd0b79be7470968f01766 --- /dev/null +++ b/4b284b6bc4seed4/evaluation/generation/examples.4b284b6bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:308ce1b7b3b0a97ac3c9bdb7035859d0bc524069c09decaaf6acd72e73e5c859 +size 4511873 diff --git a/4b284b6bc4seed4/evaluation/generation/examples.4b284b6bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl b/4b284b6bc4seed4/evaluation/generation/examples.4b284b6bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..e61ad4a9b96d7c6d09859495f208bd537edbd3de --- /dev/null +++ b/4b284b6bc4seed4/evaluation/generation/examples.4b284b6bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a06f9d452b6c36da1e96902fc893b46b7b31c1026cadeb402b0e375253e7e807 +size 5337940 diff --git a/4b284b6bc4seed4/evaluation/generation/examples.4b284b6bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl b/4b284b6bc4seed4/evaluation/generation/examples.4b284b6bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..73fe35bf1f74856a6dde308722a194c9c78017d1 --- /dev/null +++ b/4b284b6bc4seed4/evaluation/generation/examples.4b284b6bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eef4bb472d883072216c2963d206ade366463e99dc36efc5528895baf79473a8 +size 6416422 diff --git a/4b284b6bc4seed4/evaluation/generation/examples.4b284b6bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl b/4b284b6bc4seed4/evaluation/generation/examples.4b284b6bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..245daf5fdda3aa27f92ea3a60df5f4ea483e07d8 --- /dev/null +++ b/4b284b6bc4seed4/evaluation/generation/examples.4b284b6bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_3.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fa24d347a4fc3d41d7f5d3bd6c9d7fe9b10c442231360d552bff09efb359fa03 +size 7461416 diff --git a/4b284b6bc4seed4/evaluation/generation/examples.4b284b6bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl b/4b284b6bc4seed4/evaluation/generation/examples.4b284b6bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..6235402b4b8a5b98a549e30e9079bfaef84f07df --- /dev/null +++ b/4b284b6bc4seed4/evaluation/generation/examples.4b284b6bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_4.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9f2084d730232df2d21f4944d5b02a1ed5eff7b606789fdb85c9355684aacb41 +size 8489390 diff --git a/4b284b6bc4seed4/evaluation/generation/examples.4b284b6bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl b/4b284b6bc4seed4/evaluation/generation/examples.4b284b6bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..5b85bbe388a47d0b0fd339480c0382a1323a55f6 --- /dev/null +++ b/4b284b6bc4seed4/evaluation/generation/examples.4b284b6bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_5.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:96a2e0562fa6566adcc1edae3f32775d70128be8eef7aa24945424b5bcac77ad +size 9551131 diff --git a/4b284b6bc4seed4/evaluation/generation/examples.4b284b6bc4seed4_gem_xsum_article_DOC_summary_0.jsonl b/4b284b6bc4seed4/evaluation/generation/examples.4b284b6bc4seed4_gem_xsum_article_DOC_summary_0.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..9389ffbf5a6c8c39d4b764a01b930f5ce44e3f21 --- /dev/null +++ b/4b284b6bc4seed4/evaluation/generation/examples.4b284b6bc4seed4_gem_xsum_article_DOC_summary_0.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d19547805906b85054c29cc9470371cb0fac908ffc245843722eaee11e74bd47 +size 2823947 diff --git a/4b284b6bc4seed4/evaluation/generation/examples.4b284b6bc4seed4_gem_xsum_article_DOC_summary_1.jsonl b/4b284b6bc4seed4/evaluation/generation/examples.4b284b6bc4seed4_gem_xsum_article_DOC_summary_1.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..02dbbd3dd2c435966d6361a3c5eb9912ba932723 --- /dev/null +++ b/4b284b6bc4seed4/evaluation/generation/examples.4b284b6bc4seed4_gem_xsum_article_DOC_summary_1.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cc29cdc110d5f0e5c8f651b92a9782a2811f8064997a4d5f4e0209e88a4cd62b +size 5102888 diff --git a/4b284b6bc4seed4/evaluation/generation/examples.4b284b6bc4seed4_gem_xsum_article_DOC_summary_2.jsonl b/4b284b6bc4seed4/evaluation/generation/examples.4b284b6bc4seed4_gem_xsum_article_DOC_summary_2.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..92d377e52868fc5db71b544edfc2ebaf76b897b9 --- /dev/null +++ b/4b284b6bc4seed4/evaluation/generation/examples.4b284b6bc4seed4_gem_xsum_article_DOC_summary_2.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7780fcf5e1a89b998671c4bf0e645c2249088e25e847a2fedd2834c456dec71f +size 7376534 diff --git a/4b284b6bc4seed4/evaluation/generation/examples.4b284b6bc4seed4_gem_xsum_article_DOC_summary_3.jsonl b/4b284b6bc4seed4/evaluation/generation/examples.4b284b6bc4seed4_gem_xsum_article_DOC_summary_3.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..4dc62c9fbde051f86d0002146fb7fe962a1fda81 --- /dev/null +++ b/4b284b6bc4seed4/evaluation/generation/examples.4b284b6bc4seed4_gem_xsum_article_DOC_summary_3.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a200dd1df18dfa96b5579cd37dc5ff29d95f7d62ab03bd9f28aa716cd2713571 +size 9645679 diff --git a/4b284b6bc4seed4/evaluation/generation/examples.4b284b6bc4seed4_gem_xsum_article_DOC_summary_4.jsonl b/4b284b6bc4seed4/evaluation/generation/examples.4b284b6bc4seed4_gem_xsum_article_DOC_summary_4.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..882a6830d53ec2ef8f0389d017a01a4ff0410e63 --- /dev/null +++ b/4b284b6bc4seed4/evaluation/generation/examples.4b284b6bc4seed4_gem_xsum_article_DOC_summary_4.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0de588162844abc5708ee182120b3ca1877ede0177b06959513b3cd7929ec897 +size 11672188 diff --git a/4b284b6bc4seed4/evaluation/generation/examples.4b284b6bc4seed4_gem_xsum_article_DOC_summary_5.jsonl b/4b284b6bc4seed4/evaluation/generation/examples.4b284b6bc4seed4_gem_xsum_article_DOC_summary_5.jsonl new file mode 100644 index 0000000000000000000000000000000000000000..85abb6b94bef568aea33f27d4bd5cc2ab760bd8b --- /dev/null +++ b/4b284b6bc4seed4/evaluation/generation/examples.4b284b6bc4seed4_gem_xsum_article_DOC_summary_5.jsonl @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:906ebb32b15799ca479f521359b9d245a266effd3d255a7b1de8477b5b21a0ea +size 13897624 diff --git a/4b284b6bc4seed4/evaluation/generation/merged.csv b/4b284b6bc4seed4/evaluation/generation/merged.csv new file mode 100644 index 0000000000000000000000000000000000000000..bd00e9c010aab56fdd43fca4686eec6c3b608bc5 --- /dev/null +++ b/4b284b6bc4seed4/evaluation/generation/merged.csv @@ -0,0 +1,53 @@ +dataset,fewshots,prompt,metric,value +e2e_nlg_cleaned,0,generate_text_restaurant,rouge2_fmeasure,0.0021610970637232323 +e2e_nlg_cleaned,0,median,rouge2_fmeasure,0.0021610970637232323 +e2e_nlg_cleaned,1,generate_text_restaurant,rouge2_fmeasure,0.15367455208735437 +e2e_nlg_cleaned,1,median,rouge2_fmeasure,0.15367455208735437 +e2e_nlg_cleaned,2,generate_text_restaurant,rouge2_fmeasure,0.17010386224275442 +e2e_nlg_cleaned,2,median,rouge2_fmeasure,0.17010386224275442 +e2e_nlg_cleaned,3,generate_text_restaurant,rouge2_fmeasure,0.18042060590724515 +e2e_nlg_cleaned,3,median,rouge2_fmeasure,0.18042060590724515 +e2e_nlg_cleaned,4,generate_text_restaurant,rouge2_fmeasure,0.18703841259223752 +e2e_nlg_cleaned,4,median,rouge2_fmeasure,0.18703841259223752 +e2e_nlg_cleaned,5,generate_text_restaurant,rouge2_fmeasure,0.1931509426359425 +e2e_nlg_cleaned,5,median,rouge2_fmeasure,0.1931509426359425 +e2e_nlg_cleaned,5,average,multiple,0.14775824542154287 +gem_xsum,0,article_DOC_summary,rouge2_fmeasure,0.04296352475719179 +gem_xsum,0,median,rouge2_fmeasure,0.04296352475719179 +gem_xsum,1,article_DOC_summary,rouge2_fmeasure,0.030605161726994057 +gem_xsum,1,median,rouge2_fmeasure,0.030605161726994057 +gem_xsum,2,article_DOC_summary,rouge2_fmeasure,0.03194665621464301 +gem_xsum,2,median,rouge2_fmeasure,0.03194665621464301 +gem_xsum,3,article_DOC_summary,rouge2_fmeasure,0.03073680556060331 +gem_xsum,3,median,rouge2_fmeasure,0.03073680556060331 +gem_xsum,4,article_DOC_summary,rouge2_fmeasure,0.007201974037466402 +gem_xsum,4,median,rouge2_fmeasure,0.007201974037466402 +gem_xsum,5,article_DOC_summary,rouge2_fmeasure,0.00041201488569909625 +gem_xsum,5,median,rouge2_fmeasure,0.00041201488569909625 +gem_xsum,5,average,multiple,0.023977689530432944 +web_nlg_en,0,PALM_prompt,rouge2_fmeasure,0.04977759217169638 +web_nlg_en,0,median,rouge2_fmeasure,0.04977759217169638 +web_nlg_en,1,PALM_prompt,rouge2_fmeasure,0.0546051702795999 +web_nlg_en,1,median,rouge2_fmeasure,0.0546051702795999 +web_nlg_en,2,PALM_prompt,rouge2_fmeasure,0.05592276690064219 +web_nlg_en,2,median,rouge2_fmeasure,0.05592276690064219 +web_nlg_en,3,PALM_prompt,rouge2_fmeasure,0.05799188686736059 +web_nlg_en,3,median,rouge2_fmeasure,0.05799188686736059 +web_nlg_en,4,PALM_prompt,rouge2_fmeasure,0.05856459210667893 +web_nlg_en,4,median,rouge2_fmeasure,0.05856459210667893 +web_nlg_en,5,PALM_prompt,rouge2_fmeasure,0.05924660282751187 +web_nlg_en,5,median,rouge2_fmeasure,0.05924660282751187 +web_nlg_en,5,average,multiple,0.056018101858914975 +wiki_lingua_en,0,tldr_en,rouge2_fmeasure,0.040460580826441606 +wiki_lingua_en,0,median,rouge2_fmeasure,0.040460580826441606 +wiki_lingua_en,1,tldr_en,rouge2_fmeasure,0.047516585339244355 +wiki_lingua_en,1,median,rouge2_fmeasure,0.047516585339244355 +wiki_lingua_en,2,tldr_en,rouge2_fmeasure,0.05037415373416898 +wiki_lingua_en,2,median,rouge2_fmeasure,0.05037415373416898 +wiki_lingua_en,3,tldr_en,rouge2_fmeasure,0.0413255105224322 +wiki_lingua_en,3,median,rouge2_fmeasure,0.0413255105224322 +wiki_lingua_en,4,tldr_en,rouge2_fmeasure,0.012185104729686681 +wiki_lingua_en,4,median,rouge2_fmeasure,0.012185104729686681 +wiki_lingua_en,5,tldr_en,rouge2_fmeasure,0.002227060333018499 +wiki_lingua_en,5,median,rouge2_fmeasure,0.002227060333018499 +wiki_lingua_en,5,average,multiple,0.03234816591416539 diff --git a/4b284b6bc4seed4/evaluation/generation/merged.json b/4b284b6bc4seed4/evaluation/generation/merged.json new file mode 100644 index 0000000000000000000000000000000000000000..5d5e416a64dedea18771f69351292959b4bfed58 --- /dev/null +++ b/4b284b6bc4seed4/evaluation/generation/merged.json @@ -0,0 +1 @@ +{"GEM/web_nlg_en": {"0": {"PALM_prompt": {"bleu": 0.35166211431807476, "bleu_stderr": 0.038071413053652275, "rouge1_fmeasure": 0.1064177979826906, "rouge1_fmeasure_stderr": 0.002014407824130901, "rouge1_precision": 0.06996455274792455, "rouge1_precision_stderr": 0.0015592090868851113, "rouge1_recall": 0.3142067124043025, "rouge1_recall_stderr": 0.0048759710824468425, "rouge2_fmeasure": 0.04977759217169638, "rouge2_fmeasure_stderr": 0.0012651503383739272, "rouge2_precision": 0.0322534557054686, "rouge2_precision_stderr": 0.0009291159250523059, "rouge2_recall": 0.15163416252366027, "rouge2_recall_stderr": 0.003394361327422675, "rougeL_fmeasure": 0.10151875678161845, "rougeL_fmeasure_stderr": 0.0018675156066895481, "rougeL_precision": 0.0665503328402659, "rougeL_precision_stderr": 0.0014349991462073507, "rougeL_recall": 0.30272317644546903, "rougeL_recall_stderr": 0.004757737332652531, "rougeLsum_fmeasure": 0.1005468816321386, "rougeLsum_fmeasure_stderr": 0.0018871768805081306, "rougeLsum_precision": 0.06618311419871553, "rougeLsum_precision_stderr": 0.0014716875527080561, "rougeLsum_recall": 0.29700852030137187, "rougeLsum_recall_stderr": 0.004591273606148228}}, "1": {"PALM_prompt": {"bleu": 0.5073000336177755, "bleu_stderr": 0.05344474459205947, "rouge1_fmeasure": 0.11830423680079659, "rouge1_fmeasure_stderr": 0.0020114505178455027, "rouge1_precision": 0.07583504538763819, "rouge1_precision_stderr": 0.001486787446354916, "rouge1_recall": 0.3716954850162639, "rouge1_recall_stderr": 0.005205035164096044, "rouge2_fmeasure": 0.0546051702795999, "rouge2_fmeasure_stderr": 0.0012569436349181779, "rouge2_precision": 0.03495776879514267, "rouge2_precision_stderr": 0.0009075777652215385, "rouge2_recall": 0.17885977259906066, "rouge2_recall_stderr": 0.003619881028179333, "rougeL_fmeasure": 0.1099788832885831, "rougeL_fmeasure_stderr": 0.0017852180819479216, "rougeL_precision": 0.07030089422838176, "rougeL_precision_stderr": 0.001298347917395423, "rougeL_recall": 0.34696500909784356, "rougeL_recall_stderr": 0.00482360237080409, "rougeLsum_fmeasure": 0.1110119989726, "rougeLsum_fmeasure_stderr": 0.0018755811955381053, "rougeLsum_precision": 0.07122182052038024, "rougeLsum_precision_stderr": 0.0013897967007664056, "rougeLsum_recall": 0.3477576171750515, "rougeLsum_recall_stderr": 0.0047659276141866136}}, "2": {"PALM_prompt": {"bleu": 0.5965263236594742, "bleu_stderr": 0.05163954961828016, "rouge1_fmeasure": 0.12233537069614382, "rouge1_fmeasure_stderr": 0.0019128091926460928, "rouge1_precision": 0.07783318626900966, "rouge1_precision_stderr": 0.0014071193338354882, "rouge1_recall": 0.39287654613370876, "rouge1_recall_stderr": 0.005155876341027884, "rouge2_fmeasure": 0.05592276690064219, "rouge2_fmeasure_stderr": 0.001197562574066807, "rouge2_precision": 0.0354373968856108, "rouge2_precision_stderr": 0.0008545023435501012, "rouge2_recall": 0.19039459495393043, "rouge2_recall_stderr": 0.003663120720639406, "rougeL_fmeasure": 0.11320053656812012, "rougeL_fmeasure_stderr": 0.001703639135984389, "rougeL_precision": 0.07188967304527148, "rougeL_precision_stderr": 0.0012421548275795777, "rougeL_recall": 0.3648630199526146, "rougeL_recall_stderr": 0.004750553642386819, "rougeLsum_fmeasure": 0.1142026340807714, "rougeLsum_fmeasure_stderr": 0.0017614419186672153, "rougeLsum_precision": 0.07268380811649039, "rougeLsum_precision_stderr": 0.0012997045865083563, "rougeLsum_recall": 0.36691870218506767, "rougeLsum_recall_stderr": 0.004689100059731652}}, "3": {"PALM_prompt": {"bleu": 0.6590445507565462, "bleu_stderr": 0.03731228606768085, "rouge1_fmeasure": 0.1255592398663772, "rouge1_fmeasure_stderr": 0.0018984572804718245, "rouge1_precision": 0.07980698513957299, "rouge1_precision_stderr": 0.00144116669925528, "rouge1_recall": 0.40871250304941253, "rouge1_recall_stderr": 0.005277184107543118, "rouge2_fmeasure": 0.05799188686736059, "rouge2_fmeasure_stderr": 0.0012470877418224642, "rouge2_precision": 0.036737647094888005, "rouge2_precision_stderr": 0.0009490563555727562, "rouge2_recall": 0.2012500620682874, "rouge2_recall_stderr": 0.003837876814963123, "rougeL_fmeasure": 0.11563164980687576, "rougeL_fmeasure_stderr": 0.0017088580020787614, "rougeL_precision": 0.07344239380035893, "rougeL_precision_stderr": 0.001301053396600686, "rougeL_recall": 0.37652823939289803, "rougeL_recall_stderr": 0.0048219321223642725, "rougeLsum_fmeasure": 0.1170142277810441, "rougeLsum_fmeasure_stderr": 0.0017619775635762797, "rougeLsum_precision": 0.07446732582003722, "rougeLsum_precision_stderr": 0.0013512166475080024, "rougeLsum_recall": 0.37983284753458935, "rougeLsum_recall_stderr": 0.004768406523815667}}, "4": {"PALM_prompt": {"bleu": 0.6612094103636722, "bleu_stderr": 0.05316688615822092, "rouge1_fmeasure": 0.12810389443498593, "rouge1_fmeasure_stderr": 0.0018474124639315977, "rouge1_precision": 0.0814867015244332, "rouge1_precision_stderr": 0.00140335178133597, "rouge1_recall": 0.41970698412830326, "rouge1_recall_stderr": 0.005264636607062869, "rouge2_fmeasure": 0.05856459210667893, "rouge2_fmeasure_stderr": 0.0011483796934916865, "rouge2_precision": 0.03716974645311799, "rouge2_precision_stderr": 0.000858671949423613, "rouge2_recall": 0.20569650614003127, "rouge2_recall_stderr": 0.0037797450322498744, "rougeL_fmeasure": 0.11674639728784307, "rougeL_fmeasure_stderr": 0.0016142840608080332, "rougeL_precision": 0.07414197510231946, "rougeL_precision_stderr": 0.0012218676591713073, "rougeL_recall": 0.3844479540779492, "rougeL_recall_stderr": 0.004824012642018971, "rougeLsum_fmeasure": 0.11883717065008154, "rougeLsum_fmeasure_stderr": 0.0017051707976467297, "rougeLsum_precision": 0.07570666678042967, "rougeLsum_precision_stderr": 0.0013105985925116346, "rougeLsum_recall": 0.3891045320252018, "rougeLsum_recall_stderr": 0.004752985303492144}}, "5": {"PALM_prompt": {"bleu": 0.7275241684724033, "bleu_stderr": 0.025139024300557544, "rouge1_fmeasure": 0.12807283189555618, "rouge1_fmeasure_stderr": 0.0018561044445990925, "rouge1_precision": 0.08119001231813255, "rouge1_precision_stderr": 0.0014308370032712263, "rouge1_recall": 0.42544190008314364, "rouge1_recall_stderr": 0.005347650585072293, "rouge2_fmeasure": 0.05924660282751187, "rouge2_fmeasure_stderr": 0.0011837956870791252, "rouge2_precision": 0.037488476057553025, "rouge2_precision_stderr": 0.0009127843819336664, "rouge2_recall": 0.21034382299607524, "rouge2_recall_stderr": 0.0038365434728806005, "rougeL_fmeasure": 0.1163811957107418, "rougeL_fmeasure_stderr": 0.0016389675453477302, "rougeL_precision": 0.07373330048793485, "rougeL_precision_stderr": 0.0012777957450006742, "rougeL_recall": 0.38841487576118355, "rougeL_recall_stderr": 0.004859412970167045, "rougeLsum_fmeasure": 0.11860693664537329, "rougeLsum_fmeasure_stderr": 0.0017120447774363115, "rougeLsum_precision": 0.07528625093598806, "rougeLsum_precision_stderr": 0.0013390502316204457, "rougeLsum_recall": 0.39421410712837596, "rougeLsum_recall_stderr": 0.004856189403160334}}}, "GEM/wiki_lingua_en": {"0": {"tldr_en": {"bleu": 1.8709275972877584, "bleu_stderr": 0.058898637546592025, "rouge1_fmeasure": 0.18622713587913528, "rouge1_fmeasure_stderr": 0.0018412460647723918, "rouge1_precision": 0.15946778937891515, "rouge1_precision_stderr": 0.0019263515035577486, "rouge1_recall": 0.2715850357160657, "rouge1_recall_stderr": 0.0027017071210897574, "rouge2_fmeasure": 0.040460580826441606, "rouge2_fmeasure_stderr": 0.0008960319674160765, "rouge2_precision": 0.03438888805377945, "rouge2_precision_stderr": 0.0008080459258315309, "rouge2_recall": 0.06117675765752758, "rouge2_recall_stderr": 0.0015061198705940962, "rougeL_fmeasure": 0.14446880136361956, "rougeL_fmeasure_stderr": 0.0013159464984661877, "rougeL_precision": 0.12211228339854341, "rougeL_precision_stderr": 0.0013298965520439228, "rougeL_recall": 0.21625650856608786, "rougeL_recall_stderr": 0.0022314529211675395, "rougeLsum_fmeasure": 0.1716160186471173, "rougeLsum_fmeasure_stderr": 0.0016894452306051078, "rougeLsum_precision": 0.1467045219684518, "rougeLsum_precision_stderr": 0.0017626659229341545, "rougeLsum_recall": 0.25116019588094557, "rougeLsum_recall_stderr": 0.0025177140997767675}}, "1": {"tldr_en": {"bleu": 2.3540646113466352, "bleu_stderr": 0.058383312223254456, "rouge1_fmeasure": 0.2051454909041775, "rouge1_fmeasure_stderr": 0.001963503184239578, "rouge1_precision": 0.17861978084436733, "rouge1_precision_stderr": 0.0021557050699636633, "rouge1_recall": 0.29492911982793857, "rouge1_recall_stderr": 0.0027364010294303274, "rouge2_fmeasure": 0.047516585339244355, "rouge2_fmeasure_stderr": 0.0009726713638331002, "rouge2_precision": 0.04216196051123768, "rouge2_precision_stderr": 0.0009857371725593724, "rouge2_recall": 0.06892249984818269, "rouge2_recall_stderr": 0.0015097658330848196, "rougeL_fmeasure": 0.14783021982665137, "rougeL_fmeasure_stderr": 0.00133667062385201, "rougeL_precision": 0.1277101470262864, "rougeL_precision_stderr": 0.0014839765534000772, "rougeL_recall": 0.21755280146548553, "rougeL_recall_stderr": 0.0021188768570991334, "rougeLsum_fmeasure": 0.1927127973435724, "rougeLsum_fmeasure_stderr": 0.0018361383918979964, "rougeLsum_precision": 0.16764488030279848, "rougeLsum_precision_stderr": 0.002021292385911164, "rougeLsum_recall": 0.2778932641853077, "rougeLsum_recall_stderr": 0.0025900462140142086}}, "2": {"tldr_en": {"bleu": 2.5117616289013234, "bleu_stderr": 0.07882958513520422, "rouge1_fmeasure": 0.2125892107712728, "rouge1_fmeasure_stderr": 0.0018726113691632032, "rouge1_precision": 0.1867354040241945, "rouge1_precision_stderr": 0.0021764534616989487, "rouge1_recall": 0.307356685382873, "rouge1_recall_stderr": 0.002668787558898061, "rouge2_fmeasure": 0.05037415373416898, "rouge2_fmeasure_stderr": 0.0009688792622757568, "rouge2_precision": 0.044945343265659306, "rouge2_precision_stderr": 0.0010090897572849198, "rouge2_recall": 0.07429122479757874, "rouge2_recall_stderr": 0.0015703671923323263, "rougeL_fmeasure": 0.15111305737547598, "rougeL_fmeasure_stderr": 0.0012722677867412764, "rougeL_precision": 0.13207273293373048, "rougeL_precision_stderr": 0.0015334022424691339, "rougeL_recall": 0.22372031586233712, "rougeL_recall_stderr": 0.002107048468174928, "rougeLsum_fmeasure": 0.20022450371280426, "rougeLsum_fmeasure_stderr": 0.0017542714847597852, "rougeLsum_precision": 0.1758960740764525, "rougeLsum_precision_stderr": 0.0020592289423643946, "rougeLsum_recall": 0.2900411283233057, "rougeLsum_recall_stderr": 0.0025253027294766133}}, "3": {"tldr_en": {"bleu": 2.403113898933743, "bleu_stderr": 0.053251073858493, "rouge1_fmeasure": 0.17575906704306832, "rouge1_fmeasure_stderr": 0.002174949765654744, "rouge1_precision": 0.1591881844404937, "rouge1_precision_stderr": 0.0024467695339504187, "rouge1_recall": 0.25516734786727036, "rouge1_recall_stderr": 0.0032356801874518703, "rouge2_fmeasure": 0.0413255105224322, "rouge2_fmeasure_stderr": 0.000931832765467482, "rouge2_precision": 0.03784379091188361, "rouge2_precision_stderr": 0.001089131871792838, "rouge2_recall": 0.0624780077769272, "rouge2_recall_stderr": 0.0016087440931355302, "rougeL_fmeasure": 0.12628359782789042, "rougeL_fmeasure_stderr": 0.0015182895930992903, "rougeL_precision": 0.11442394801240031, "rougeL_precision_stderr": 0.0018112801572746817, "rougeL_recall": 0.18773348293405673, "rougeL_recall_stderr": 0.002527108820020842, "rougeLsum_fmeasure": 0.16530823720647217, "rougeLsum_fmeasure_stderr": 0.0020367190470455404, "rougeLsum_precision": 0.14968568215454517, "rougeLsum_precision_stderr": 0.002308127867301231, "rougeLsum_recall": 0.2408810647537952, "rougeLsum_recall_stderr": 0.0030822171919214422}}, "4": {"tldr_en": {"bleu": 0.472345677088637, "bleu_stderr": 0.040900356286228075, "rouge1_fmeasure": 0.0557867591334426, "rouge1_fmeasure_stderr": 0.00186394804170534, "rouge1_precision": 0.052405749034228705, "rouge1_precision_stderr": 0.0020110499867171685, "rouge1_recall": 0.08478707705138788, "rouge1_recall_stderr": 0.0028865777805548412, "rouge2_fmeasure": 0.012185104729686681, "rouge2_fmeasure_stderr": 0.0005907016058266906, "rouge2_precision": 0.011080419003140766, "rouge2_precision_stderr": 0.0006523070791806857, "rouge2_recall": 0.01999068467854864, "rouge2_recall_stderr": 0.001096551185475821, "rougeL_fmeasure": 0.04111644120483341, "rougeL_fmeasure_stderr": 0.0013476527639030426, "rougeL_precision": 0.03862877667774788, "rougeL_precision_stderr": 0.0014997122070137985, "rougeL_recall": 0.0641687643508006, "rougeL_recall_stderr": 0.002226474813987104, "rougeLsum_fmeasure": 0.052305917688342855, "rougeLsum_fmeasure_stderr": 0.0017400550554708667, "rougeLsum_precision": 0.04914657123032221, "rougeLsum_precision_stderr": 0.0018810939013272998, "rougeLsum_recall": 0.07980206255787106, "rougeLsum_recall_stderr": 0.0027207315430338498}}, "5": {"tldr_en": {"bleu": 6.538062149513937e-07, "bleu_stderr": 1.1494813563989744e-06, "rouge1_fmeasure": 0.00898341548277317, "rouge1_fmeasure_stderr": 0.0008281424457556686, "rouge1_precision": 0.008509363653553257, "rouge1_precision_stderr": 0.000845658818252671, "rouge1_recall": 0.01382276652509776, "rouge1_recall_stderr": 0.0013334225811003739, "rouge2_fmeasure": 0.002227060333018499, "rouge2_fmeasure_stderr": 0.0002638537239607946, "rouge2_precision": 0.0019932915366697277, "rouge2_precision_stderr": 0.0002440516250439588, "rouge2_recall": 0.004040972091745142, "rouge2_recall_stderr": 0.0006014270152725088, "rougeL_fmeasure": 0.006634289847575651, "rougeL_fmeasure_stderr": 0.0006061194677904214, "rougeL_precision": 0.006364757119046798, "rougeL_precision_stderr": 0.0006395473026447492, "rougeL_recall": 0.010409531448448452, "rougeL_recall_stderr": 0.0010327387282074423, "rougeLsum_fmeasure": 0.008483394098012836, "rougeLsum_fmeasure_stderr": 0.0007802466552819305, "rougeLsum_precision": 0.00802904222397337, "rougeLsum_precision_stderr": 0.0007953313177037809, "rougeLsum_recall": 0.013136908473646484, "rougeLsum_recall_stderr": 0.0012773726821035238}}}, "e2e_nlg_cleaned": {"0": {"generate_text_restaurant": {"bleu": 0.20344702036475212, "bleu_stderr": 0.020813423545746928, "rouge1_fmeasure": 0.02272612382623739, "rouge1_fmeasure_stderr": 0.000657613160095564, "rouge1_precision": 0.02031066874429793, "rouge1_precision_stderr": 0.0010982973394100017, "rouge1_recall": 0.0339006777431073, "rouge1_recall_stderr": 0.0010754582360608094, "rouge2_fmeasure": 0.0021610970637232323, "rouge2_fmeasure_stderr": 0.00025014704785064965, "rouge2_precision": 0.004428962002328776, "rouge2_precision_stderr": 0.0010133668145643837, "rouge2_recall": 0.0032484488515415436, "rouge2_recall_stderr": 0.00039041664574734875, "rougeL_fmeasure": 0.022638837838076648, "rougeL_fmeasure_stderr": 0.000646894021986954, "rougeL_precision": 0.02023890948503867, "rougeL_precision_stderr": 0.001094108815755343, "rougeL_recall": 0.03378068019453833, "rougeL_recall_stderr": 0.0010619663136781138, "rougeLsum_fmeasure": 0.021275240072120734, "rougeLsum_fmeasure_stderr": 0.0005850724780177193, "rougeLsum_precision": 0.019207655955704183, "rougeLsum_precision_stderr": 0.0010760427436256133, "rougeLsum_recall": 0.03164987205173273, "rougeLsum_recall_stderr": 0.0009558614487519096}}, "1": {"generate_text_restaurant": {"bleu": 6.931679880377635, "bleu_stderr": 0.12521222343600627, "rouge1_fmeasure": 0.35867604679541404, "rouge1_fmeasure_stderr": 0.0022242609651642654, "rouge1_precision": 0.34003150968688334, "rouge1_precision_stderr": 0.003075339331446666, "rouge1_recall": 0.45015732570626815, "rouge1_recall_stderr": 0.0028997064403193467, "rouge2_fmeasure": 0.15367455208735437, "rouge2_fmeasure_stderr": 0.0016232409779530833, "rouge2_precision": 0.14759589015368266, "rouge2_precision_stderr": 0.002060777542304401, "rouge2_recall": 0.1951244486489613, "rouge2_recall_stderr": 0.0020953412261598093, "rougeL_fmeasure": 0.2708573841017006, "rougeL_fmeasure_stderr": 0.0016414160973280045, "rougeL_precision": 0.25480483800873843, "rougeL_precision_stderr": 0.0023341935238719103, "rougeL_recall": 0.3465181251792575, "rougeL_recall_stderr": 0.0024646626498150185, "rougeLsum_fmeasure": 0.29387614768355197, "rougeLsum_fmeasure_stderr": 0.0021153745644870423, "rougeLsum_precision": 0.2799685955963331, "rougeLsum_precision_stderr": 0.0028032299642029843, "rougeLsum_recall": 0.3677356916274029, "rougeLsum_recall_stderr": 0.0026996771832412166}}, "2": {"generate_text_restaurant": {"bleu": 7.657232828965316, "bleu_stderr": 0.12471874140369284, "rouge1_fmeasure": 0.3776586411733957, "rouge1_fmeasure_stderr": 0.002198646985806164, "rouge1_precision": 0.35675768591806567, "rouge1_precision_stderr": 0.0031022663155459203, "rouge1_recall": 0.46937017367708633, "rouge1_recall_stderr": 0.00275346130622528, "rouge2_fmeasure": 0.17010386224275442, "rouge2_fmeasure_stderr": 0.0016283471019571314, "rouge2_precision": 0.16231756057946886, "rouge2_precision_stderr": 0.0020395417907086693, "rouge2_recall": 0.2138289664047894, "rouge2_recall_stderr": 0.0020707270316515283, "rougeL_fmeasure": 0.28123834488197835, "rougeL_fmeasure_stderr": 0.0016069446891559397, "rougeL_precision": 0.26310458036396617, "rougeL_precision_stderr": 0.002272981131996748, "rougeL_recall": 0.35664473399252883, "rougeL_recall_stderr": 0.0023940807408273975, "rougeLsum_fmeasure": 0.30825756247609604, "rougeLsum_fmeasure_stderr": 0.0020874241622850045, "rougeLsum_precision": 0.2914642398591572, "rougeLsum_precision_stderr": 0.002757164859310039, "rougeLsum_recall": 0.3829945698750505, "rougeLsum_recall_stderr": 0.0026117917187163785}}, "3": {"generate_text_restaurant": {"bleu": 8.442104172996691, "bleu_stderr": 0.1225265310989897, "rouge1_fmeasure": 0.39418201029816835, "rouge1_fmeasure_stderr": 0.0021766899975066423, "rouge1_precision": 0.37510123434341147, "rouge1_precision_stderr": 0.0029659588823890727, "rouge1_recall": 0.47688116434271155, "rouge1_recall_stderr": 0.002779761613350503, "rouge2_fmeasure": 0.18042060590724515, "rouge2_fmeasure_stderr": 0.0016663829828460059, "rouge2_precision": 0.1722185872161438, "rouge2_precision_stderr": 0.001982108880961337, "rouge2_recall": 0.22148343783169197, "rouge2_recall_stderr": 0.0021298024706319753, "rougeL_fmeasure": 0.2871477669735601, "rougeL_fmeasure_stderr": 0.0016369768534961649, "rougeL_precision": 0.2708367244008351, "rougeL_precision_stderr": 0.002174690044000994, "rougeL_recall": 0.35404771153503223, "rougeL_recall_stderr": 0.002443187318628693, "rougeLsum_fmeasure": 0.3246521112217336, "rougeLsum_fmeasure_stderr": 0.002119544362824107, "rougeLsum_precision": 0.30935204172558023, "rougeLsum_precision_stderr": 0.0026977427492078823, "rougeLsum_recall": 0.3923447311858455, "rougeLsum_recall_stderr": 0.0026716176658316635}}, "4": {"generate_text_restaurant": {"bleu": 9.264771481612339, "bleu_stderr": 0.14797632752636197, "rouge1_fmeasure": 0.4086207638030011, "rouge1_fmeasure_stderr": 0.0020852610120524026, "rouge1_precision": 0.3925987211674676, "rouge1_precision_stderr": 0.0026976461573692354, "rouge1_recall": 0.47354063069748037, "rouge1_recall_stderr": 0.0026338292343196816, "rouge2_fmeasure": 0.18703841259223752, "rouge2_fmeasure_stderr": 0.0016890429531878357, "rouge2_precision": 0.1796234616071412, "rouge2_precision_stderr": 0.0018685574967649593, "rouge2_recall": 0.2190905542412407, "rouge2_recall_stderr": 0.002068607728271308, "rougeL_fmeasure": 0.29515772076134655, "rougeL_fmeasure_stderr": 0.0016661150684501613, "rougeL_precision": 0.2819581010790434, "rougeL_precision_stderr": 0.002044363363394681, "rougeL_recall": 0.346344258787895, "rougeL_recall_stderr": 0.0023161012828013965, "rougeLsum_fmeasure": 0.3382507422373424, "rougeLsum_fmeasure_stderr": 0.0021124639320887124, "rougeLsum_precision": 0.32521791939739797, "rougeLsum_precision_stderr": 0.0025320061675288244, "rougeLsum_recall": 0.3913010253854303, "rougeLsum_recall_stderr": 0.0025849947764755407}}, "5": {"generate_text_restaurant": {"bleu": 9.958980611111656, "bleu_stderr": 0.14855771135694565, "rouge1_fmeasure": 0.4197228631027415, "rouge1_fmeasure_stderr": 0.0020063425382385058, "rouge1_precision": 0.4061514037393209, "rouge1_precision_stderr": 0.0025821552864821757, "rouge1_recall": 0.47804480569363766, "rouge1_recall_stderr": 0.002643357770719704, "rouge2_fmeasure": 0.1931509426359425, "rouge2_fmeasure_stderr": 0.001665707134510459, "rouge2_precision": 0.18757831560333757, "rouge2_precision_stderr": 0.001891660346486441, "rouge2_recall": 0.2218502429628836, "rouge2_recall_stderr": 0.0020386307840161645, "rougeL_fmeasure": 0.3017298916186032, "rougeL_fmeasure_stderr": 0.0017018141577312348, "rougeL_precision": 0.2911232268001962, "rougeL_precision_stderr": 0.0020806579815607195, "rougeL_recall": 0.3466822060660839, "rougeL_recall_stderr": 0.002329148139407088, "rougeLsum_fmeasure": 0.35086688827184365, "rougeLsum_fmeasure_stderr": 0.0020482132353444454, "rougeLsum_precision": 0.33992936633595283, "rougeLsum_precision_stderr": 0.0024759755832926282, "rougeLsum_recall": 0.39927240691403565, "rougeLsum_recall_stderr": 0.0025795756365194628}}}, "gem_xsum": {"0": {"article_DOC_summary": {"bleu": 1.7847107445080181, "bleu_stderr": 0.12259281036544756, "rouge1_fmeasure": 0.20091233893732696, "rouge1_fmeasure_stderr": 0.002460990636185999, "rouge1_precision": 0.14717191874948962, "rouge1_precision_stderr": 0.002039989999763031, "rouge1_recall": 0.34130886710278735, "rouge1_recall_stderr": 0.004109809014072106, "rouge2_fmeasure": 0.04296352475719179, "rouge2_fmeasure_stderr": 0.0015091336137169667, "rouge2_precision": 0.031180276988501406, "rouge2_precision_stderr": 0.0011515924925153934, "rouge2_recall": 0.0750546362679565, "rouge2_recall_stderr": 0.002664189585730598, "rougeL_fmeasure": 0.15294193870162445, "rougeL_fmeasure_stderr": 0.0018589320642533784, "rougeL_precision": 0.11187209453346593, "rougeL_precision_stderr": 0.0015620035707168242, "rougeL_recall": 0.26167076851220833, "rougeL_recall_stderr": 0.0032523973074039445, "rougeLsum_fmeasure": 0.15798602735496012, "rougeLsum_fmeasure_stderr": 0.0020505297987330412, "rougeLsum_precision": 0.11548986592851035, "rougeLsum_precision_stderr": 0.0016848405957502828, "rougeLsum_recall": 0.27023318122685785, "rougeLsum_recall_stderr": 0.0035574900499767722}}, "1": {"article_DOC_summary": {"bleu": 1.1845032944798495, "bleu_stderr": 0.08458246586222135, "rouge1_fmeasure": 0.17024912689462188, "rouge1_fmeasure_stderr": 0.0023476916428796877, "rouge1_precision": 0.12097137240313847, "rouge1_precision_stderr": 0.0017496349490089252, "rouge1_recall": 0.2990148200796171, "rouge1_recall_stderr": 0.003991241961142267, "rouge2_fmeasure": 0.030605161726994057, "rouge2_fmeasure_stderr": 0.0012798169612394362, "rouge2_precision": 0.021525610014554653, "rouge2_precision_stderr": 0.0009005470188155159, "rouge2_recall": 0.055447375013310755, "rouge2_recall_stderr": 0.002401181861336932, "rougeL_fmeasure": 0.13223813090153158, "rougeL_fmeasure_stderr": 0.0017763582648502928, "rougeL_precision": 0.09373642633960022, "rougeL_precision_stderr": 0.001306812474264428, "rougeL_recall": 0.23409871583030145, "rougeL_recall_stderr": 0.0031894294773192737, "rougeLsum_fmeasure": 0.13796987863879345, "rougeLsum_fmeasure_stderr": 0.0019475228863655185, "rougeLsum_precision": 0.0978239478590475, "rougeLsum_precision_stderr": 0.0014318544124746646, "rougeLsum_recall": 0.24391576493442443, "rougeLsum_recall_stderr": 0.0034515787165719444}}, "2": {"article_DOC_summary": {"bleu": 1.235087762721956, "bleu_stderr": 0.12954971142620794, "rouge1_fmeasure": 0.17123176762196604, "rouge1_fmeasure_stderr": 0.002367991688636443, "rouge1_precision": 0.12153696089604207, "rouge1_precision_stderr": 0.0017564783405385376, "rouge1_recall": 0.30200065000392107, "rouge1_recall_stderr": 0.004133147911453231, "rouge2_fmeasure": 0.03194665621464301, "rouge2_fmeasure_stderr": 0.0012704379487708378, "rouge2_precision": 0.022397648703525567, "rouge2_precision_stderr": 0.0008966352941752963, "rouge2_recall": 0.05865756100278522, "rouge2_recall_stderr": 0.002417706489905652, "rougeL_fmeasure": 0.13347870518175978, "rougeL_fmeasure_stderr": 0.001810460575841908, "rougeL_precision": 0.09454924200528139, "rougeL_precision_stderr": 0.0013285980685601034, "rougeL_recall": 0.23705948565261042, "rougeL_recall_stderr": 0.0033238074174046623, "rougeLsum_fmeasure": 0.13805797792168725, "rougeLsum_fmeasure_stderr": 0.0019538992181766693, "rougeLsum_precision": 0.09773827044948902, "rougeLsum_precision_stderr": 0.0014279562335011396, "rougeLsum_recall": 0.24540888083433957, "rougeLsum_recall_stderr": 0.0035863376843111756}}, "3": {"article_DOC_summary": {"bleu": 1.2530842896627028, "bleu_stderr": 0.1292510298416823, "rouge1_fmeasure": 0.1640154958358604, "rouge1_fmeasure_stderr": 0.0025105121490214565, "rouge1_precision": 0.11912123096636808, "rouge1_precision_stderr": 0.001985064027306789, "rouge1_recall": 0.284241972897382, "rouge1_recall_stderr": 0.00429277701738966, "rouge2_fmeasure": 0.03073680556060331, "rouge2_fmeasure_stderr": 0.0012970855907124138, "rouge2_precision": 0.022035764094734074, "rouge2_precision_stderr": 0.0009495941851705396, "rouge2_recall": 0.05485929060591564, "rouge2_recall_stderr": 0.0023528230640158182, "rougeL_fmeasure": 0.12797306233278474, "rougeL_fmeasure_stderr": 0.0018874238035470816, "rougeL_precision": 0.09256740744943301, "rougeL_precision_stderr": 0.0014688063331016958, "rougeL_recall": 0.2237667779749703, "rougeL_recall_stderr": 0.0033868663103060566, "rougeLsum_fmeasure": 0.13064448950535576, "rougeLsum_fmeasure_stderr": 0.0020334528859491884, "rougeLsum_precision": 0.09452589861322153, "rougeLsum_precision_stderr": 0.0015705338179864972, "rougeLsum_recall": 0.22814994714493522, "rougeLsum_recall_stderr": 0.0036128044767980974}}, "4": {"article_DOC_summary": {"bleu": 0.5139598974348316, "bleu_stderr": 0.11912575032590099, "rouge1_fmeasure": 0.04359155004979404, "rouge1_fmeasure_stderr": 0.002446009970548131, "rouge1_precision": 0.036060956179475516, "rouge1_precision_stderr": 0.002146455590056505, "rouge1_recall": 0.0690610482890532, "rouge1_recall_stderr": 0.003982103092460407, "rouge2_fmeasure": 0.007201974037466402, "rouge2_fmeasure_stderr": 0.0006993387361055898, "rouge2_precision": 0.00544898809262409, "rouge2_precision_stderr": 0.0005451635252349526, "rouge2_recall": 0.012376718286934233, "rouge2_recall_stderr": 0.001258378038487793, "rougeL_fmeasure": 0.034064899256478404, "rougeL_fmeasure_stderr": 0.0019036508052699063, "rougeL_precision": 0.02859153283892875, "rougeL_precision_stderr": 0.0017520581139644556, "rougeL_recall": 0.0540675976921445, "rougeL_recall_stderr": 0.0031205628190529014, "rougeLsum_fmeasure": 0.035141373500357204, "rougeLsum_fmeasure_stderr": 0.0019687859509567853, "rougeLsum_precision": 0.02946392180089849, "rougeLsum_precision_stderr": 0.0018091240355730465, "rougeLsum_recall": 0.05579499878286511, "rougeLsum_recall_stderr": 0.0032320807958250114}}, "5": {"article_DOC_summary": {"bleu": 1.5223289746048162e-36, "bleu_stderr": 3.669632606867041e-32, "rouge1_fmeasure": 0.0026631982951325368, "rouge1_fmeasure_stderr": 0.0007488447516617362, "rouge1_precision": 0.00304016734736987, "rouge1_precision_stderr": 0.000888339058787168, "rouge1_recall": 0.002441151228222129, "rouge1_recall_stderr": 0.0006688844091459975, "rouge2_fmeasure": 0.00041201488569909625, "rouge2_fmeasure_stderr": 0.0002949309636685756, "rouge2_precision": 0.0005433276798426632, "rouge2_precision_stderr": 0.00039244433049951473, "rouge2_recall": 0.00033315740862910673, "rouge2_recall_stderr": 0.0002365408622759455, "rougeL_fmeasure": 0.0019214818091001502, "rougeL_fmeasure_stderr": 0.0005698678616813168, "rougeL_precision": 0.002191679085043183, "rougeL_precision_stderr": 0.000685805567529641, "rougeL_recall": 0.0017718084851004953, "rougeL_recall_stderr": 0.0005070173978560121, "rougeLsum_fmeasure": 0.001998668773079567, "rougeLsum_fmeasure_stderr": 0.000600651825136055, "rougeLsum_precision": 0.002284463934531111, "rougeLsum_precision_stderr": 0.0007267983753519665, "rougeLsum_recall": 0.0018384573787288605, "rougeLsum_recall_stderr": 0.000531115868075893}}}} \ No newline at end of file diff --git a/4b284b6bc4seed4/evaluation/generation/slim.4b284b6bc4seed4_GEM-web_nlg_en_PALM_prompt_0.json b/4b284b6bc4seed4/evaluation/generation/slim.4b284b6bc4seed4_GEM-web_nlg_en_PALM_prompt_0.json new file mode 100644 index 0000000000000000000000000000000000000000..addc0952e85ecd04ef592b43170e026078811908 --- /dev/null +++ b/4b284b6bc4seed4/evaluation/generation/slim.4b284b6bc4seed4_GEM-web_nlg_en_PALM_prompt_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.35166211431807476, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.038071413053652275 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.06996455274792455, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0015592090868851113 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.3142067124043025, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0048759710824468425 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.1064177979826906, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.002014407824130901 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.0322534557054686, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0009291159250523059 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.15163416252366027, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.003394361327422675 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.04977759217169638, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0012651503383739272 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.0665503328402659, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0014349991462073507 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.30272317644546903, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004757737332652531 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.10151875678161845, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0018675156066895481 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.06618311419871553, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0014716875527080561 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.29700852030137187, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004591273606148228 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.1005468816321386, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0018871768805081306 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b6bc4seed4/evaluation/generation/slim.4b284b6bc4seed4_GEM-web_nlg_en_PALM_prompt_1.json b/4b284b6bc4seed4/evaluation/generation/slim.4b284b6bc4seed4_GEM-web_nlg_en_PALM_prompt_1.json new file mode 100644 index 0000000000000000000000000000000000000000..2a56beaeb73bdd0286a02be0515339bb401c40dd --- /dev/null +++ b/4b284b6bc4seed4/evaluation/generation/slim.4b284b6bc4seed4_GEM-web_nlg_en_PALM_prompt_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.5073000336177755, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.05344474459205947 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.07583504538763819, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.001486787446354916 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.3716954850162639, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.005205035164096044 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.11830423680079659, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0020114505178455027 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.03495776879514267, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0009075777652215385 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.17885977259906066, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.003619881028179333 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.0546051702795999, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0012569436349181779 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.07030089422838176, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.001298347917395423 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.34696500909784356, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.00482360237080409 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.1099788832885831, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0017852180819479216 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.07122182052038024, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0013897967007664056 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.3477576171750515, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0047659276141866136 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.1110119989726, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0018755811955381053 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b6bc4seed4/evaluation/generation/slim.4b284b6bc4seed4_GEM-web_nlg_en_PALM_prompt_2.json b/4b284b6bc4seed4/evaluation/generation/slim.4b284b6bc4seed4_GEM-web_nlg_en_PALM_prompt_2.json new file mode 100644 index 0000000000000000000000000000000000000000..6a1bcaac3263e7c6cd12e73d4c7f0ae21a10586b --- /dev/null +++ b/4b284b6bc4seed4/evaluation/generation/slim.4b284b6bc4seed4_GEM-web_nlg_en_PALM_prompt_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.5965263236594742, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.05163954961828016 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.07783318626900966, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0014071193338354882 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.39287654613370876, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.005155876341027884 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.12233537069614382, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0019128091926460928 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.0354373968856108, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0008545023435501012 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.19039459495393043, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.003663120720639406 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.05592276690064219, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.001197562574066807 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.07188967304527148, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0012421548275795777 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.3648630199526146, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004750553642386819 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.11320053656812012, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.001703639135984389 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.07268380811649039, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0012997045865083563 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.36691870218506767, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004689100059731652 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.1142026340807714, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0017614419186672153 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b6bc4seed4/evaluation/generation/slim.4b284b6bc4seed4_GEM-web_nlg_en_PALM_prompt_3.json b/4b284b6bc4seed4/evaluation/generation/slim.4b284b6bc4seed4_GEM-web_nlg_en_PALM_prompt_3.json new file mode 100644 index 0000000000000000000000000000000000000000..22dd52aeddf672f6a2c90d37c4d7791b40aa291d --- /dev/null +++ b/4b284b6bc4seed4/evaluation/generation/slim.4b284b6bc4seed4_GEM-web_nlg_en_PALM_prompt_3.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.6590445507565462, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.03731228606768085 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.07980698513957299, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.00144116669925528 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.40871250304941253, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.005277184107543118 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.1255592398663772, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0018984572804718245 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.036737647094888005, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0009490563555727562 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.2012500620682874, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.003837876814963123 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.05799188686736059, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0012470877418224642 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.07344239380035893, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.001301053396600686 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.37652823939289803, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0048219321223642725 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.11563164980687576, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0017088580020787614 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.07446732582003722, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0013512166475080024 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.37983284753458935, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004768406523815667 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.1170142277810441, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0017619775635762797 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 3, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b6bc4seed4/evaluation/generation/slim.4b284b6bc4seed4_GEM-web_nlg_en_PALM_prompt_4.json b/4b284b6bc4seed4/evaluation/generation/slim.4b284b6bc4seed4_GEM-web_nlg_en_PALM_prompt_4.json new file mode 100644 index 0000000000000000000000000000000000000000..4031741234d63af5254e45ba07f6761ac29e5e1c --- /dev/null +++ b/4b284b6bc4seed4/evaluation/generation/slim.4b284b6bc4seed4_GEM-web_nlg_en_PALM_prompt_4.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.6612094103636722, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.05316688615822092 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.0814867015244332, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.00140335178133597 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.41970698412830326, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.005264636607062869 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.12810389443498593, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0018474124639315977 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.03716974645311799, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.000858671949423613 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.20569650614003127, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0037797450322498744 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.05856459210667893, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0011483796934916865 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.07414197510231946, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0012218676591713073 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.3844479540779492, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004824012642018971 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.11674639728784307, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0016142840608080332 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.07570666678042967, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0013105985925116346 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.3891045320252018, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004752985303492144 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.11883717065008154, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0017051707976467297 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 4, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b6bc4seed4/evaluation/generation/slim.4b284b6bc4seed4_GEM-web_nlg_en_PALM_prompt_5.json b/4b284b6bc4seed4/evaluation/generation/slim.4b284b6bc4seed4_GEM-web_nlg_en_PALM_prompt_5.json new file mode 100644 index 0000000000000000000000000000000000000000..bba9c4550462ddcc603c773ed224c5e96379cd0a --- /dev/null +++ b/4b284b6bc4seed4/evaluation/generation/slim.4b284b6bc4seed4_GEM-web_nlg_en_PALM_prompt_5.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "bleu": 0.7275241684724033, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.025139024300557544 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_precision": 0.08119001231813255, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0014308370032712263 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_recall": 0.42544190008314364, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.005347650585072293 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge1_fmeasure": 0.12807283189555618, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0018561044445990925 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_precision": 0.037488476057553025, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0009127843819336664 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_recall": 0.21034382299607524, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0038365434728806005 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rouge2_fmeasure": 0.05924660282751187, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0011837956870791252 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_precision": 0.07373330048793485, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0012777957450006742 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_recall": 0.38841487576118355, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.004859412970167045 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeL_fmeasure": 0.1163811957107418, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0016389675453477302 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_precision": 0.07528625093598806, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0013390502316204457 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_recall": 0.39421410712837596, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.004856189403160334 + }, + { + "task_name": "GEM/web_nlg_en", + "prompt_name": "PALM_prompt", + "rougeLsum_fmeasure": 0.11860693664537329, + "dataset_path": "GEM/web_nlg", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0017120447774363115 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 5, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b6bc4seed4/evaluation/generation/slim.4b284b6bc4seed4_GEM-wiki_lingua_en_tldr_en_0.json b/4b284b6bc4seed4/evaluation/generation/slim.4b284b6bc4seed4_GEM-wiki_lingua_en_tldr_en_0.json new file mode 100644 index 0000000000000000000000000000000000000000..17bb6cac293a6dd0ca36690b0ea4af36ecadad1f --- /dev/null +++ b/4b284b6bc4seed4/evaluation/generation/slim.4b284b6bc4seed4_GEM-wiki_lingua_en_tldr_en_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.15946778937891515, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0019263515035577486 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.2715850357160657, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0027017071210897574 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.18622713587913528, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0018412460647723918 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.03438888805377945, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0008080459258315309 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.06117675765752758, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0015061198705940962 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.040460580826441606, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0008960319674160765 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.12211228339854341, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0013298965520439228 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.21625650856608786, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0022314529211675395 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.14446880136361956, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0013159464984661877 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.1467045219684518, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0017626659229341545 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.25116019588094557, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0025177140997767675 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.1716160186471173, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0016894452306051078 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 1.8709275972877584, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.058898637546592025 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b6bc4seed4/evaluation/generation/slim.4b284b6bc4seed4_GEM-wiki_lingua_en_tldr_en_1.json b/4b284b6bc4seed4/evaluation/generation/slim.4b284b6bc4seed4_GEM-wiki_lingua_en_tldr_en_1.json new file mode 100644 index 0000000000000000000000000000000000000000..78b04dea302acee64a8f9769f2d414790442df28 --- /dev/null +++ b/4b284b6bc4seed4/evaluation/generation/slim.4b284b6bc4seed4_GEM-wiki_lingua_en_tldr_en_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.17861978084436733, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0021557050699636633 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.29492911982793857, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0027364010294303274 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.2051454909041775, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.001963503184239578 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.04216196051123768, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0009857371725593724 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.06892249984818269, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0015097658330848196 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.047516585339244355, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0009726713638331002 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.1277101470262864, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0014839765534000772 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.21755280146548553, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0021188768570991334 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.14783021982665137, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.00133667062385201 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.16764488030279848, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.002021292385911164 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.2778932641853077, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0025900462140142086 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.1927127973435724, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0018361383918979964 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 2.3540646113466352, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.058383312223254456 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b6bc4seed4/evaluation/generation/slim.4b284b6bc4seed4_GEM-wiki_lingua_en_tldr_en_2.json b/4b284b6bc4seed4/evaluation/generation/slim.4b284b6bc4seed4_GEM-wiki_lingua_en_tldr_en_2.json new file mode 100644 index 0000000000000000000000000000000000000000..a29c4c6371da9ec3b030ec172c9c8e912124f6e0 --- /dev/null +++ b/4b284b6bc4seed4/evaluation/generation/slim.4b284b6bc4seed4_GEM-wiki_lingua_en_tldr_en_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.1867354040241945, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0021764534616989487 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.307356685382873, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.002668787558898061 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.2125892107712728, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0018726113691632032 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.044945343265659306, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0010090897572849198 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.07429122479757874, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0015703671923323263 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.05037415373416898, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0009688792622757568 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.13207273293373048, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0015334022424691339 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.22372031586233712, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.002107048468174928 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.15111305737547598, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0012722677867412764 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.1758960740764525, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0020592289423643946 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.2900411283233057, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0025253027294766133 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.20022450371280426, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0017542714847597852 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 2.5117616289013234, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.07882958513520422 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b6bc4seed4/evaluation/generation/slim.4b284b6bc4seed4_GEM-wiki_lingua_en_tldr_en_3.json b/4b284b6bc4seed4/evaluation/generation/slim.4b284b6bc4seed4_GEM-wiki_lingua_en_tldr_en_3.json new file mode 100644 index 0000000000000000000000000000000000000000..163e5b95a0735ca298cb122b5561a37b42fdee77 --- /dev/null +++ b/4b284b6bc4seed4/evaluation/generation/slim.4b284b6bc4seed4_GEM-wiki_lingua_en_tldr_en_3.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.1591881844404937, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0024467695339504187 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.25516734786727036, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0032356801874518703 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.17575906704306832, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.002174949765654744 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.03784379091188361, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.001089131871792838 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.0624780077769272, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0016087440931355302 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.0413255105224322, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.000931832765467482 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.11442394801240031, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0018112801572746817 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.18773348293405673, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.002527108820020842 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.12628359782789042, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0015182895930992903 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.14968568215454517, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.002308127867301231 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.2408810647537952, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0030822171919214422 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.16530823720647217, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0020367190470455404 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 2.403113898933743, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.053251073858493 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 3, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b6bc4seed4/evaluation/generation/slim.4b284b6bc4seed4_GEM-wiki_lingua_en_tldr_en_4.json b/4b284b6bc4seed4/evaluation/generation/slim.4b284b6bc4seed4_GEM-wiki_lingua_en_tldr_en_4.json new file mode 100644 index 0000000000000000000000000000000000000000..6ea51b43d02f06ce14a0ea90b3345e497c698247 --- /dev/null +++ b/4b284b6bc4seed4/evaluation/generation/slim.4b284b6bc4seed4_GEM-wiki_lingua_en_tldr_en_4.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.052405749034228705, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.0020110499867171685 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.08478707705138788, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0028865777805548412 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.0557867591334426, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.00186394804170534 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.011080419003140766, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0006523070791806857 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.01999068467854864, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.001096551185475821 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.012185104729686681, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0005907016058266906 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.03862877667774788, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0014997122070137985 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.0641687643508006, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.002226474813987104 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.04111644120483341, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0013476527639030426 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.04914657123032221, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0018810939013272998 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.07980206255787106, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0027207315430338498 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.052305917688342855, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0017400550554708667 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 0.472345677088637, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 0.040900356286228075 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 4, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b6bc4seed4/evaluation/generation/slim.4b284b6bc4seed4_GEM-wiki_lingua_en_tldr_en_5.json b/4b284b6bc4seed4/evaluation/generation/slim.4b284b6bc4seed4_GEM-wiki_lingua_en_tldr_en_5.json new file mode 100644 index 0000000000000000000000000000000000000000..251ac02b4599312b049dd598fd820bee102290f2 --- /dev/null +++ b/4b284b6bc4seed4/evaluation/generation/slim.4b284b6bc4seed4_GEM-wiki_lingua_en_tldr_en_5.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_precision": 0.008509363653553257, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_precision_stderr": 0.000845658818252671 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_recall": 0.01382276652509776, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_recall_stderr": 0.0013334225811003739 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge1_fmeasure": 0.00898341548277317, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge1_fmeasure_stderr": 0.0008281424457556686 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_precision": 0.0019932915366697277, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_precision_stderr": 0.0002440516250439588 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_recall": 0.004040972091745142, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_recall_stderr": 0.0006014270152725088 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rouge2_fmeasure": 0.002227060333018499, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rouge2_fmeasure_stderr": 0.0002638537239607946 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_precision": 0.006364757119046798, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_precision_stderr": 0.0006395473026447492 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_recall": 0.010409531448448452, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_recall_stderr": 0.0010327387282074423 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeL_fmeasure": 0.006634289847575651, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeL_fmeasure_stderr": 0.0006061194677904214 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_precision": 0.00802904222397337, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_precision_stderr": 0.0007953313177037809 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_recall": 0.013136908473646484, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_recall_stderr": 0.0012773726821035238 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "rougeLsum_fmeasure": 0.008483394098012836, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0007802466552819305 + }, + { + "task_name": "GEM/wiki_lingua_en", + "prompt_name": "tldr_en", + "bleu": 6.538062149513937e-07, + "dataset_path": "GEM/wiki_lingua", + "dataset_name": "en", + "subset": null, + "bleu_stderr": 1.1494813563989744e-06 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 5, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b6bc4seed4/evaluation/generation/slim.4b284b6bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_0.json b/4b284b6bc4seed4/evaluation/generation/slim.4b284b6bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_0.json new file mode 100644 index 0000000000000000000000000000000000000000..1930086cef823d24ba2c245fd5c3f87ae50ab2e4 --- /dev/null +++ b/4b284b6bc4seed4/evaluation/generation/slim.4b284b6bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 0.20344702036475212, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.020813423545746928 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.02031066874429793, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.0010982973394100017 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.0339006777431073, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.0010754582360608094 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.02272612382623739, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.000657613160095564 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.004428962002328776, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0010133668145643837 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.0032484488515415436, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.00039041664574734875 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.0021610970637232323, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.00025014704785064965 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.02023890948503867, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.001094108815755343 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.03378068019453833, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.0010619663136781138 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.022638837838076648, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.000646894021986954 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.019207655955704183, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.0010760427436256133 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.03164987205173273, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.0009558614487519096 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.021275240072120734, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0005850724780177193 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b6bc4seed4/evaluation/generation/slim.4b284b6bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_1.json b/4b284b6bc4seed4/evaluation/generation/slim.4b284b6bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_1.json new file mode 100644 index 0000000000000000000000000000000000000000..ebac2655651b369c3bc41017ce45ad5eeec857e1 --- /dev/null +++ b/4b284b6bc4seed4/evaluation/generation/slim.4b284b6bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 6.931679880377635, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.12521222343600627 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.34003150968688334, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.003075339331446666 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.45015732570626815, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.0028997064403193467 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.35867604679541404, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.0022242609651642654 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.14759589015368266, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.002060777542304401 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.1951244486489613, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.0020953412261598093 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.15367455208735437, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0016232409779530833 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.25480483800873843, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.0023341935238719103 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.3465181251792575, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.0024646626498150185 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.2708573841017006, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0016414160973280045 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.2799685955963331, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.0028032299642029843 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.3677356916274029, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.0026996771832412166 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.29387614768355197, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0021153745644870423 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b6bc4seed4/evaluation/generation/slim.4b284b6bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_2.json b/4b284b6bc4seed4/evaluation/generation/slim.4b284b6bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_2.json new file mode 100644 index 0000000000000000000000000000000000000000..ea088cf4e58b09b03c4d994f290171389681c49f --- /dev/null +++ b/4b284b6bc4seed4/evaluation/generation/slim.4b284b6bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 7.657232828965316, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.12471874140369284 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.35675768591806567, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.0031022663155459203 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.46937017367708633, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.00275346130622528 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.3776586411733957, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.002198646985806164 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.16231756057946886, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0020395417907086693 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.2138289664047894, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.0020707270316515283 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.17010386224275442, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0016283471019571314 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.26310458036396617, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.002272981131996748 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.35664473399252883, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.0023940807408273975 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.28123834488197835, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0016069446891559397 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.2914642398591572, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.002757164859310039 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.3829945698750505, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.0026117917187163785 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.30825756247609604, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0020874241622850045 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b6bc4seed4/evaluation/generation/slim.4b284b6bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_3.json b/4b284b6bc4seed4/evaluation/generation/slim.4b284b6bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_3.json new file mode 100644 index 0000000000000000000000000000000000000000..8bae361e06fd47d8f9664be969d7a2791784682c --- /dev/null +++ b/4b284b6bc4seed4/evaluation/generation/slim.4b284b6bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_3.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 8.442104172996691, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.1225265310989897 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.37510123434341147, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.0029659588823890727 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.47688116434271155, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.002779761613350503 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.39418201029816835, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.0021766899975066423 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.1722185872161438, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.001982108880961337 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.22148343783169197, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.0021298024706319753 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.18042060590724515, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0016663829828460059 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.2708367244008351, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.002174690044000994 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.35404771153503223, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.002443187318628693 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.2871477669735601, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0016369768534961649 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.30935204172558023, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.0026977427492078823 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.3923447311858455, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.0026716176658316635 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.3246521112217336, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.002119544362824107 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 3, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b6bc4seed4/evaluation/generation/slim.4b284b6bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_4.json b/4b284b6bc4seed4/evaluation/generation/slim.4b284b6bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_4.json new file mode 100644 index 0000000000000000000000000000000000000000..19762426d2dd463313fbb6d5241a7ded97c22680 --- /dev/null +++ b/4b284b6bc4seed4/evaluation/generation/slim.4b284b6bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_4.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 9.264771481612339, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.14797632752636197 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.3925987211674676, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.0026976461573692354 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.47354063069748037, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.0026338292343196816 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.4086207638030011, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.0020852610120524026 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.1796234616071412, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.0018685574967649593 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.2190905542412407, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.002068607728271308 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.18703841259223752, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.0016890429531878357 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.2819581010790434, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.002044363363394681 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.346344258787895, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.0023161012828013965 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.29515772076134655, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0016661150684501613 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.32521791939739797, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.0025320061675288244 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.3913010253854303, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.0025849947764755407 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.3382507422373424, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0021124639320887124 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 4, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b6bc4seed4/evaluation/generation/slim.4b284b6bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_5.json b/4b284b6bc4seed4/evaluation/generation/slim.4b284b6bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_5.json new file mode 100644 index 0000000000000000000000000000000000000000..b4f6751c5bb889611ab6e6ce4ec7690d46615bf6 --- /dev/null +++ b/4b284b6bc4seed4/evaluation/generation/slim.4b284b6bc4seed4_e2e_nlg_cleaned_generate_text_restaurant_5.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "bleu": 9.958980611111656, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "bleu_stderr": 0.14855771135694565 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_precision": 0.4061514037393209, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_precision_stderr": 0.0025821552864821757 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_recall": 0.47804480569363766, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_recall_stderr": 0.002643357770719704 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge1_fmeasure": 0.4197228631027415, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge1_fmeasure_stderr": 0.0020063425382385058 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_precision": 0.18757831560333757, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_precision_stderr": 0.001891660346486441 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_recall": 0.2218502429628836, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_recall_stderr": 0.0020386307840161645 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rouge2_fmeasure": 0.1931509426359425, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rouge2_fmeasure_stderr": 0.001665707134510459 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_precision": 0.2911232268001962, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_precision_stderr": 0.0020806579815607195 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_recall": 0.3466822060660839, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_recall_stderr": 0.002329148139407088 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeL_fmeasure": 0.3017298916186032, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeL_fmeasure_stderr": 0.0017018141577312348 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_precision": 0.33992936633595283, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_precision_stderr": 0.0024759755832926282 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_recall": 0.39927240691403565, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_recall_stderr": 0.0025795756365194628 + }, + { + "task_name": "e2e_nlg_cleaned", + "prompt_name": "generate_text_restaurant", + "rougeLsum_fmeasure": 0.35086688827184365, + "dataset_path": "e2e_nlg_cleaned", + "dataset_name": null, + "subset": null, + "rougeLsum_fmeasure_stderr": 0.0020482132353444454 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 5, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b6bc4seed4/evaluation/generation/slim.4b284b6bc4seed4_gem_xsum_article_DOC_summary_0.json b/4b284b6bc4seed4/evaluation/generation/slim.4b284b6bc4seed4_gem_xsum_article_DOC_summary_0.json new file mode 100644 index 0000000000000000000000000000000000000000..d4703950a325edf68df4cfb1601b08cdc0c5adcb --- /dev/null +++ b/4b284b6bc4seed4/evaluation/generation/slim.4b284b6bc4seed4_gem_xsum_article_DOC_summary_0.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.14717191874948962, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.002039989999763031 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.34130886710278735, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.004109809014072106 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.20091233893732696, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.002460990636185999 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.031180276988501406, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0011515924925153934 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.0750546362679565, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.002664189585730598 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.04296352475719179, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0015091336137169667 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.11187209453346593, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0015620035707168242 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.26167076851220833, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.0032523973074039445 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.15294193870162445, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0018589320642533784 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.11548986592851035, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0016848405957502828 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.27023318122685785, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.0035574900499767722 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.15798602735496012, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0020505297987330412 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 1.7847107445080181, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.12259281036544756 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 0, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b6bc4seed4/evaluation/generation/slim.4b284b6bc4seed4_gem_xsum_article_DOC_summary_1.json b/4b284b6bc4seed4/evaluation/generation/slim.4b284b6bc4seed4_gem_xsum_article_DOC_summary_1.json new file mode 100644 index 0000000000000000000000000000000000000000..8fbee7983e1190f323a91b5957b214edcf8c2e08 --- /dev/null +++ b/4b284b6bc4seed4/evaluation/generation/slim.4b284b6bc4seed4_gem_xsum_article_DOC_summary_1.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.12097137240313847, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.0017496349490089252 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.2990148200796171, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.003991241961142267 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.17024912689462188, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.0023476916428796877 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.021525610014554653, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0009005470188155159 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.055447375013310755, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.002401181861336932 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.030605161726994057, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0012798169612394362 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.09373642633960022, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.001306812474264428 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.23409871583030145, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.0031894294773192737 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.13223813090153158, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0017763582648502928 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.0978239478590475, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0014318544124746646 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.24391576493442443, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.0034515787165719444 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.13796987863879345, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0019475228863655185 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 1.1845032944798495, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.08458246586222135 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 1, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b6bc4seed4/evaluation/generation/slim.4b284b6bc4seed4_gem_xsum_article_DOC_summary_2.json b/4b284b6bc4seed4/evaluation/generation/slim.4b284b6bc4seed4_gem_xsum_article_DOC_summary_2.json new file mode 100644 index 0000000000000000000000000000000000000000..86045c5c7b44fb53eab1cefacbd55cb5bfae3886 --- /dev/null +++ b/4b284b6bc4seed4/evaluation/generation/slim.4b284b6bc4seed4_gem_xsum_article_DOC_summary_2.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.12153696089604207, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.0017564783405385376 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.30200065000392107, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.004133147911453231 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.17123176762196604, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.002367991688636443 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.022397648703525567, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0008966352941752963 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.05865756100278522, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.002417706489905652 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.03194665621464301, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0012704379487708378 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.09454924200528139, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0013285980685601034 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.23705948565261042, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.0033238074174046623 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.13347870518175978, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.001810460575841908 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.09773827044948902, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0014279562335011396 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.24540888083433957, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.0035863376843111756 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.13805797792168725, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0019538992181766693 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 1.235087762721956, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.12954971142620794 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 2, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b6bc4seed4/evaluation/generation/slim.4b284b6bc4seed4_gem_xsum_article_DOC_summary_3.json b/4b284b6bc4seed4/evaluation/generation/slim.4b284b6bc4seed4_gem_xsum_article_DOC_summary_3.json new file mode 100644 index 0000000000000000000000000000000000000000..96e92178992b8e82641f79b221fc5587c70a0613 --- /dev/null +++ b/4b284b6bc4seed4/evaluation/generation/slim.4b284b6bc4seed4_gem_xsum_article_DOC_summary_3.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.11912123096636808, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.001985064027306789 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.284241972897382, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.00429277701738966 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.1640154958358604, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.0025105121490214565 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.022035764094734074, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0009495941851705396 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.05485929060591564, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.0023528230640158182 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.03073680556060331, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0012970855907124138 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.09256740744943301, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0014688063331016958 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.2237667779749703, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.0033868663103060566 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.12797306233278474, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0018874238035470816 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.09452589861322153, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0015705338179864972 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.22814994714493522, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.0036128044767980974 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.13064448950535576, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0020334528859491884 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 1.2530842896627028, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.1292510298416823 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 3, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b6bc4seed4/evaluation/generation/slim.4b284b6bc4seed4_gem_xsum_article_DOC_summary_4.json b/4b284b6bc4seed4/evaluation/generation/slim.4b284b6bc4seed4_gem_xsum_article_DOC_summary_4.json new file mode 100644 index 0000000000000000000000000000000000000000..94784dbd2bfea028fb998edb4db66ab82c2a34b0 --- /dev/null +++ b/4b284b6bc4seed4/evaluation/generation/slim.4b284b6bc4seed4_gem_xsum_article_DOC_summary_4.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.036060956179475516, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.002146455590056505 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.0690610482890532, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.003982103092460407 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.04359155004979404, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.002446009970548131 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.00544898809262409, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.0005451635252349526 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.012376718286934233, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.001258378038487793 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.007201974037466402, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0006993387361055898 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.02859153283892875, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.0017520581139644556 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.0540675976921445, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.0031205628190529014 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.034064899256478404, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0019036508052699063 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.02946392180089849, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0018091240355730465 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.05579499878286511, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.0032320807958250114 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.035141373500357204, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.0019687859509567853 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 0.5139598974348316, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 0.11912575032590099 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 4, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b6bc4seed4/evaluation/generation/slim.4b284b6bc4seed4_gem_xsum_article_DOC_summary_5.json b/4b284b6bc4seed4/evaluation/generation/slim.4b284b6bc4seed4_gem_xsum_article_DOC_summary_5.json new file mode 100644 index 0000000000000000000000000000000000000000..d47b42cc21626b7232093e4bcf81c3abd5f5744c --- /dev/null +++ b/4b284b6bc4seed4/evaluation/generation/slim.4b284b6bc4seed4_gem_xsum_article_DOC_summary_5.json @@ -0,0 +1,133 @@ +{ + "results": [ + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_precision": 0.00304016734736987, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_precision_stderr": 0.000888339058787168 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_recall": 0.002441151228222129, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_recall_stderr": 0.0006688844091459975 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge1_fmeasure": 0.0026631982951325368, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge1_fmeasure_stderr": 0.0007488447516617362 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_precision": 0.0005433276798426632, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_precision_stderr": 0.00039244433049951473 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_recall": 0.00033315740862910673, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_recall_stderr": 0.0002365408622759455 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rouge2_fmeasure": 0.00041201488569909625, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rouge2_fmeasure_stderr": 0.0002949309636685756 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_precision": 0.002191679085043183, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_precision_stderr": 0.000685805567529641 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_recall": 0.0017718084851004953, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_recall_stderr": 0.0005070173978560121 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeL_fmeasure": 0.0019214818091001502, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeL_fmeasure_stderr": 0.0005698678616813168 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_precision": 0.002284463934531111, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_precision_stderr": 0.0007267983753519665 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_recall": 0.0018384573787288605, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_recall_stderr": 0.000531115868075893 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "rougeLsum_fmeasure": 0.001998668773079567, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "rougeLsum_fmeasure_stderr": 0.000600651825136055 + }, + { + "task_name": "gem_xsum", + "prompt_name": "article_DOC_summary", + "bleu": 1.5223289746048162e-36, + "dataset_path": "GEM/xsum", + "dataset_name": null, + "subset": "", + "bleu_stderr": 3.669632606867041e-32 + } + ], + "config": { + "model": "hf-causal", + "model_args": "pretrained=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/lm1-4b2-84b-c4seeds/4b284b6bc4seed4/transformers,use_accelerate=True,tokenizer=/pfs/lustrep4/scratch/project_462000119/muennighoff/nov-2022-bettercom/gpt2,dtype=bfloat16", + "task_args": "", + "num_fewshot": 5, + "batch_size": 16, + "device": "cuda", + "use_cache": false, + "limit": 3000, + "bootstrap_iters": 10, + "seed": 1234 + } +} \ No newline at end of file diff --git a/4b284b6bc4seed4/evaluation/rankeval/4b284b6bc4seed4_0.csv b/4b284b6bc4seed4/evaluation/rankeval/4b284b6bc4seed4_0.csv new file mode 100644 index 0000000000000000000000000000000000000000..20607edb10f6d0167930ab24eff431d24708b558 --- /dev/null +++ b/4b284b6bc4seed4/evaluation/rankeval/4b284b6bc4seed4_0.csv @@ -0,0 +1,21 @@ +task,metric,value,err,version +anli_r1,acc,0.343,0.015019206922356951,0 +anli_r2,acc,0.329,0.014865395385928364,0 +anli_r3,acc,0.3333333333333333,0.0136139500102256,0 +arc_challenge,acc,0.2551194539249147,0.012739038695202105,0 +arc_challenge,acc_norm,0.2841296928327645,0.013179442447653886,0 +arc_easy,acc,0.5660774410774411,0.01016979577046211,0 +arc_easy,acc_norm,0.49873737373737376,0.010259750807991153,0 +boolq,acc,0.5685015290519878,0.008662594569027309,1 +cb,acc,0.39285714285714285,0.0658538889806635,1 +cb,f1,0.20571590265987547,,1 +copa,acc,0.73,0.044619604333847394,0 +hellaswag,acc,0.44453296156144195,0.004958983318274571,0 +hellaswag,acc_norm,0.5728938458474407,0.004936470085238491,0 +piqa,acc,0.7404787812840044,0.010227939888173922,0 +piqa,acc_norm,0.7459194776931447,0.010157271999135051,0 +rte,acc,0.48014440433212996,0.0300727231673172,0 +sciq,acc,0.802,0.01260773393417531,0 +sciq,acc_norm,0.706,0.014414290540008215,0 +storycloze_2016,acc,0.7017637626937466,0.010579249795578815,0 +winogrande,acc,0.5619573796369376,0.013944181296470804,0 diff --git a/4b284b6bc4seed4/evaluation/rankeval/4b284b6bc4seed4_0.json b/4b284b6bc4seed4/evaluation/rankeval/4b284b6bc4seed4_0.json new file mode 100644 index 0000000000000000000000000000000000000000..6fde998e1abeb05b83eee61ceaeec3a875993cfc --- /dev/null +++ b/4b284b6bc4seed4/evaluation/rankeval/4b284b6bc4seed4_0.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.343, + "acc_stderr": 0.015019206922356951 + }, + "anli_r2": { + "acc": 0.329, + "acc_stderr": 0.014865395385928364 + }, + "anli_r3": { + "acc": 0.3333333333333333, + "acc_stderr": 0.0136139500102256 + }, + "cb": { + "acc": 0.39285714285714285, + "acc_stderr": 0.0658538889806635, + "f1": 0.20571590265987547 + }, + "copa": { + "acc": 0.73, + "acc_stderr": 0.044619604333847394 + }, + "hellaswag": { + "acc": 0.44453296156144195, + "acc_stderr": 0.004958983318274571, + "acc_norm": 0.5728938458474407, + "acc_norm_stderr": 0.004936470085238491 + }, + "rte": { + "acc": 0.48014440433212996, + "acc_stderr": 0.0300727231673172 + }, + "winogrande": { + "acc": 0.5619573796369376, + "acc_stderr": 0.013944181296470804 + }, + "storycloze_2016": { + "acc": 0.7017637626937466, + "acc_stderr": 0.010579249795578815 + }, + "boolq": { + "acc": 0.5685015290519878, + "acc_stderr": 0.008662594569027309 + }, + "arc_easy": { + "acc": 0.5660774410774411, + "acc_stderr": 0.01016979577046211, + "acc_norm": 0.49873737373737376, + "acc_norm_stderr": 0.010259750807991153 + }, + "arc_challenge": { + "acc": 0.2551194539249147, + "acc_stderr": 0.012739038695202105, + "acc_norm": 0.2841296928327645, + "acc_norm_stderr": 0.013179442447653886 + }, + "sciq": { + "acc": 0.802, + "acc_stderr": 0.01260773393417531, + "acc_norm": 0.706, + "acc_norm_stderr": 0.014414290540008215 + }, + "piqa": { + "acc": 0.7404787812840044, + "acc_stderr": 0.010227939888173922, + "acc_norm": 0.7459194776931447, + "acc_norm_stderr": 0.010157271999135051 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b6bc4seed4/evaluation/rankeval/4b284b6bc4seed4_1.csv b/4b284b6bc4seed4/evaluation/rankeval/4b284b6bc4seed4_1.csv new file mode 100644 index 0000000000000000000000000000000000000000..9d5d85ee1eeeac162c086e2a4e36c2b873c68b62 --- /dev/null +++ b/4b284b6bc4seed4/evaluation/rankeval/4b284b6bc4seed4_1.csv @@ -0,0 +1,21 @@ +task,metric,value,err,version +anli_r1,acc,0.328,0.014853842487270336,0 +anli_r2,acc,0.33,0.014876872027456738,0 +anli_r3,acc,0.35083333333333333,0.013782212417178204,0 +arc_challenge,acc,0.26791808873720135,0.012942030195136426,0 +arc_challenge,acc_norm,0.2858361774744027,0.013203196088537369,0 +arc_easy,acc,0.5761784511784511,0.010140006095213603,0 +arc_easy,acc_norm,0.5374579124579124,0.010230952104570798,0 +boolq,acc,0.5737003058103975,0.008649531625805671,1 +cb,acc,0.5,0.06741998624632421,1 +cb,f1,0.34491725768321513,,1 +copa,acc,0.73,0.04461960433384741,0 +hellaswag,acc,0.4425413264289982,0.004956724392646535,0 +hellaswag,acc_norm,0.5784704242182832,0.00492794806148606,0 +piqa,acc,0.7437431991294886,0.010185787831565056,0 +piqa,acc_norm,0.7383025027203483,0.010255630772708229,0 +rte,acc,0.5018050541516246,0.030096267148976626,0 +sciq,acc,0.836,0.011715000693181316,0 +sciq,acc_norm,0.788,0.01293148186493804,0 +storycloze_2016,acc,0.6937466595403528,0.010659088460112754,0 +winogrande,acc,0.5493291239147593,0.01398392886904024,0 diff --git a/4b284b6bc4seed4/evaluation/rankeval/4b284b6bc4seed4_1.json b/4b284b6bc4seed4/evaluation/rankeval/4b284b6bc4seed4_1.json new file mode 100644 index 0000000000000000000000000000000000000000..da8d2d88205b820387dd5230ab79951473cfc25b --- /dev/null +++ b/4b284b6bc4seed4/evaluation/rankeval/4b284b6bc4seed4_1.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.328, + "acc_stderr": 0.014853842487270336 + }, + "anli_r2": { + "acc": 0.33, + "acc_stderr": 0.014876872027456738 + }, + "anli_r3": { + "acc": 0.35083333333333333, + "acc_stderr": 0.013782212417178204 + }, + "cb": { + "acc": 0.5, + "acc_stderr": 0.06741998624632421, + "f1": 0.34491725768321513 + }, + "copa": { + "acc": 0.73, + "acc_stderr": 0.04461960433384741 + }, + "hellaswag": { + "acc": 0.4425413264289982, + "acc_stderr": 0.004956724392646535, + "acc_norm": 0.5784704242182832, + "acc_norm_stderr": 0.00492794806148606 + }, + "rte": { + "acc": 0.5018050541516246, + "acc_stderr": 0.030096267148976626 + }, + "winogrande": { + "acc": 0.5493291239147593, + "acc_stderr": 0.01398392886904024 + }, + "storycloze_2016": { + "acc": 0.6937466595403528, + "acc_stderr": 0.010659088460112754 + }, + "boolq": { + "acc": 0.5737003058103975, + "acc_stderr": 0.008649531625805671 + }, + "arc_easy": { + "acc": 0.5761784511784511, + "acc_stderr": 0.010140006095213603, + "acc_norm": 0.5374579124579124, + "acc_norm_stderr": 0.010230952104570798 + }, + "arc_challenge": { + "acc": 0.26791808873720135, + "acc_stderr": 0.012942030195136426, + "acc_norm": 0.2858361774744027, + "acc_norm_stderr": 0.013203196088537369 + }, + "sciq": { + "acc": 0.836, + "acc_stderr": 0.011715000693181316, + "acc_norm": 0.788, + "acc_norm_stderr": 0.01293148186493804 + }, + "piqa": { + "acc": 0.7437431991294886, + "acc_stderr": 0.010185787831565056, + "acc_norm": 0.7383025027203483, + "acc_norm_stderr": 0.010255630772708229 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b6bc4seed4/evaluation/rankeval/4b284b6bc4seed4_2.csv b/4b284b6bc4seed4/evaluation/rankeval/4b284b6bc4seed4_2.csv new file mode 100644 index 0000000000000000000000000000000000000000..000729a8a8e99943f26b7b711795d2372649712f --- /dev/null +++ b/4b284b6bc4seed4/evaluation/rankeval/4b284b6bc4seed4_2.csv @@ -0,0 +1,21 @@ +task,metric,value,err,version +anli_r1,acc,0.318,0.014734079309311901,0 +anli_r2,acc,0.34,0.014987482264363937,0 +anli_r3,acc,0.3516666666666667,0.013789711695404803,0 +arc_challenge,acc,0.2568259385665529,0.0127669237941168,0 +arc_challenge,acc_norm,0.295221843003413,0.013329750293382316,0 +arc_easy,acc,0.5976430976430976,0.010062244711011525,0 +arc_easy,acc_norm,0.5585016835016835,0.010189314382749927,0 +boolq,acc,0.5871559633027523,0.008611172430472871,1 +cb,acc,0.4642857142857143,0.0672477765493766,1 +cb,f1,0.3260233918128655,,1 +copa,acc,0.74,0.0440844002276808,0 +hellaswag,acc,0.44284007169886475,0.004957068377516515,0 +hellaswag,acc_norm,0.58105954989046,0.004923772581848488,0 +piqa,acc,0.7399347116430903,0.0102348932490613,0 +piqa,acc_norm,0.7470076169749728,0.010142888698862453,0 +rte,acc,0.48014440433212996,0.0300727231673172,0 +sciq,acc,0.847,0.011389500459665532,0 +sciq,acc_norm,0.809,0.012436787112179482,0 +storycloze_2016,acc,0.692143238909674,0.010674598158758175,0 +winogrande,acc,0.5548539857932123,0.01396766295435549,0 diff --git a/4b284b6bc4seed4/evaluation/rankeval/4b284b6bc4seed4_2.json b/4b284b6bc4seed4/evaluation/rankeval/4b284b6bc4seed4_2.json new file mode 100644 index 0000000000000000000000000000000000000000..19274cad77899e2706daa2d2c73ac1aad17ea95b --- /dev/null +++ b/4b284b6bc4seed4/evaluation/rankeval/4b284b6bc4seed4_2.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.318, + "acc_stderr": 0.014734079309311901 + }, + "anli_r2": { + "acc": 0.34, + "acc_stderr": 0.014987482264363937 + }, + "anli_r3": { + "acc": 0.3516666666666667, + "acc_stderr": 0.013789711695404803 + }, + "cb": { + "acc": 0.4642857142857143, + "acc_stderr": 0.0672477765493766, + "f1": 0.3260233918128655 + }, + "copa": { + "acc": 0.74, + "acc_stderr": 0.0440844002276808 + }, + "hellaswag": { + "acc": 0.44284007169886475, + "acc_stderr": 0.004957068377516515, + "acc_norm": 0.58105954989046, + "acc_norm_stderr": 0.004923772581848488 + }, + "rte": { + "acc": 0.48014440433212996, + "acc_stderr": 0.0300727231673172 + }, + "winogrande": { + "acc": 0.5548539857932123, + "acc_stderr": 0.01396766295435549 + }, + "storycloze_2016": { + "acc": 0.692143238909674, + "acc_stderr": 0.010674598158758175 + }, + "boolq": { + "acc": 0.5871559633027523, + "acc_stderr": 0.008611172430472871 + }, + "arc_easy": { + "acc": 0.5976430976430976, + "acc_stderr": 0.010062244711011525, + "acc_norm": 0.5585016835016835, + "acc_norm_stderr": 0.010189314382749927 + }, + "arc_challenge": { + "acc": 0.2568259385665529, + "acc_stderr": 0.0127669237941168, + "acc_norm": 0.295221843003413, + "acc_norm_stderr": 0.013329750293382316 + }, + "sciq": { + "acc": 0.847, + "acc_stderr": 0.011389500459665532, + "acc_norm": 0.809, + "acc_norm_stderr": 0.012436787112179482 + }, + "piqa": { + "acc": 0.7399347116430903, + "acc_stderr": 0.0102348932490613, + "acc_norm": 0.7470076169749728, + "acc_norm_stderr": 0.010142888698862453 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b6bc4seed4/evaluation/rankeval/4b284b6bc4seed4_3.csv b/4b284b6bc4seed4/evaluation/rankeval/4b284b6bc4seed4_3.csv new file mode 100644 index 0000000000000000000000000000000000000000..db4de1a84cac1eafd920fb3c53a6662a2f8a520d --- /dev/null +++ b/4b284b6bc4seed4/evaluation/rankeval/4b284b6bc4seed4_3.csv @@ -0,0 +1,21 @@ +task,metric,value,err,version +anli_r1,acc,0.311,0.014645596385722692,0 +anli_r2,acc,0.357,0.015158521721486773,0 +anli_r3,acc,0.3233333333333333,0.01350837286730022,0 +arc_challenge,acc,0.2645051194539249,0.012889272949313366,0 +arc_challenge,acc_norm,0.2883959044368601,0.01323839442242817,0 +arc_easy,acc,0.5925925925925926,0.010082326627832865,0 +arc_easy,acc_norm,0.5656565656565656,0.010170943451269421,0 +boolq,acc,0.5776758409785933,0.008638883260317736,1 +cb,acc,0.5178571428571429,0.06737697508644647,1 +cb,f1,0.4390740542278427,,1 +copa,acc,0.75,0.04351941398892446,0 +hellaswag,acc,0.4457279426409082,0.004960299952519407,0 +hellaswag,acc_norm,0.5819557857000598,0.004922294797766662,0 +piqa,acc,0.7328618063112078,0.010323440492612445,0 +piqa,acc_norm,0.7437431991294886,0.010185787831565058,0 +rte,acc,0.5884476534296029,0.029621832222417196,0 +sciq,acc,0.863,0.010878848714333316,0 +sciq,acc_norm,0.821,0.012128730605719113,0 +storycloze_2016,acc,0.6926777124532336,0.010669445081866662,0 +winogrande,acc,0.5367008681925809,0.01401457845884326,0 diff --git a/4b284b6bc4seed4/evaluation/rankeval/4b284b6bc4seed4_3.json b/4b284b6bc4seed4/evaluation/rankeval/4b284b6bc4seed4_3.json new file mode 100644 index 0000000000000000000000000000000000000000..b29a95d5356e3fdd4ee8248b6b7823866298e368 --- /dev/null +++ b/4b284b6bc4seed4/evaluation/rankeval/4b284b6bc4seed4_3.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.311, + "acc_stderr": 0.014645596385722692 + }, + "anli_r2": { + "acc": 0.357, + "acc_stderr": 0.015158521721486773 + }, + "anli_r3": { + "acc": 0.3233333333333333, + "acc_stderr": 0.01350837286730022 + }, + "cb": { + "acc": 0.5178571428571429, + "acc_stderr": 0.06737697508644647, + "f1": 0.4390740542278427 + }, + "copa": { + "acc": 0.75, + "acc_stderr": 0.04351941398892446 + }, + "hellaswag": { + "acc": 0.4457279426409082, + "acc_stderr": 0.004960299952519407, + "acc_norm": 0.5819557857000598, + "acc_norm_stderr": 0.004922294797766662 + }, + "rte": { + "acc": 0.5884476534296029, + "acc_stderr": 0.029621832222417196 + }, + "winogrande": { + "acc": 0.5367008681925809, + "acc_stderr": 0.01401457845884326 + }, + "storycloze_2016": { + "acc": 0.6926777124532336, + "acc_stderr": 0.010669445081866662 + }, + "boolq": { + "acc": 0.5776758409785933, + "acc_stderr": 0.008638883260317736 + }, + "arc_easy": { + "acc": 0.5925925925925926, + "acc_stderr": 0.010082326627832865, + "acc_norm": 0.5656565656565656, + "acc_norm_stderr": 0.010170943451269421 + }, + "arc_challenge": { + "acc": 0.2645051194539249, + "acc_stderr": 0.012889272949313366, + "acc_norm": 0.2883959044368601, + "acc_norm_stderr": 0.01323839442242817 + }, + "sciq": { + "acc": 0.863, + "acc_stderr": 0.010878848714333316, + "acc_norm": 0.821, + "acc_norm_stderr": 0.012128730605719113 + }, + "piqa": { + "acc": 0.7328618063112078, + "acc_stderr": 0.010323440492612445, + "acc_norm": 0.7437431991294886, + "acc_norm_stderr": 0.010185787831565058 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b6bc4seed4/evaluation/rankeval/4b284b6bc4seed4_4.csv b/4b284b6bc4seed4/evaluation/rankeval/4b284b6bc4seed4_4.csv new file mode 100644 index 0000000000000000000000000000000000000000..75525fbe6815c22046f0830e96434d2755411e62 --- /dev/null +++ b/4b284b6bc4seed4/evaluation/rankeval/4b284b6bc4seed4_4.csv @@ -0,0 +1,21 @@ +task,metric,value,err,version +anli_r1,acc,0.365,0.015231776226264891,0 +anli_r2,acc,0.357,0.015158521721486778,0 +anli_r3,acc,0.3458333333333333,0.013736245342311014,0 +arc_challenge,acc,0.2525597269624573,0.012696728980207704,0 +arc_challenge,acc_norm,0.29436860068259385,0.013318528460539422,0 +arc_easy,acc,0.5925925925925926,0.010082326627832861,0 +arc_easy,acc_norm,0.5664983164983165,0.010168640625454101,0 +boolq,acc,0.5761467889908257,0.008643046537505769,1 +cb,acc,0.5357142857142857,0.06724777654937658,1 +cb,f1,0.3502178649237473,,1 +copa,acc,0.74,0.0440844002276808,0 +hellaswag,acc,0.442441744672376,0.0049566093272184015,0 +hellaswag,acc_norm,0.5873332005576578,0.004913076844433741,0 +piqa,acc,0.7366702937976061,0.010276185322196764,0 +piqa,acc_norm,0.7448313384113167,0.01017157159252183,0 +rte,acc,0.48736462093862815,0.030086851767188564,0 +sciq,acc,0.868,0.010709373963528031,0 +sciq,acc_norm,0.838,0.01165726777130442,0 +storycloze_2016,acc,0.694815606627472,0.010648664383985668,0 +winogrande,acc,0.5469613259668509,0.013990366632148104,0 diff --git a/4b284b6bc4seed4/evaluation/rankeval/4b284b6bc4seed4_4.json b/4b284b6bc4seed4/evaluation/rankeval/4b284b6bc4seed4_4.json new file mode 100644 index 0000000000000000000000000000000000000000..a3396441093de0349e6d5599d4a436009373d8b4 --- /dev/null +++ b/4b284b6bc4seed4/evaluation/rankeval/4b284b6bc4seed4_4.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.365, + "acc_stderr": 0.015231776226264891 + }, + "anli_r2": { + "acc": 0.357, + "acc_stderr": 0.015158521721486778 + }, + "anli_r3": { + "acc": 0.3458333333333333, + "acc_stderr": 0.013736245342311014 + }, + "cb": { + "acc": 0.5357142857142857, + "acc_stderr": 0.06724777654937658, + "f1": 0.3502178649237473 + }, + "copa": { + "acc": 0.74, + "acc_stderr": 0.0440844002276808 + }, + "hellaswag": { + "acc": 0.442441744672376, + "acc_stderr": 0.0049566093272184015, + "acc_norm": 0.5873332005576578, + "acc_norm_stderr": 0.004913076844433741 + }, + "rte": { + "acc": 0.48736462093862815, + "acc_stderr": 0.030086851767188564 + }, + "winogrande": { + "acc": 0.5469613259668509, + "acc_stderr": 0.013990366632148104 + }, + "storycloze_2016": { + "acc": 0.694815606627472, + "acc_stderr": 0.010648664383985668 + }, + "boolq": { + "acc": 0.5761467889908257, + "acc_stderr": 0.008643046537505769 + }, + "arc_easy": { + "acc": 0.5925925925925926, + "acc_stderr": 0.010082326627832861, + "acc_norm": 0.5664983164983165, + "acc_norm_stderr": 0.010168640625454101 + }, + "arc_challenge": { + "acc": 0.2525597269624573, + "acc_stderr": 0.012696728980207704, + "acc_norm": 0.29436860068259385, + "acc_norm_stderr": 0.013318528460539422 + }, + "sciq": { + "acc": 0.868, + "acc_stderr": 0.010709373963528031, + "acc_norm": 0.838, + "acc_norm_stderr": 0.01165726777130442 + }, + "piqa": { + "acc": 0.7366702937976061, + "acc_stderr": 0.010276185322196764, + "acc_norm": 0.7448313384113167, + "acc_norm_stderr": 0.01017157159252183 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b6bc4seed4/evaluation/rankeval/4b284b6bc4seed4_5.csv b/4b284b6bc4seed4/evaluation/rankeval/4b284b6bc4seed4_5.csv new file mode 100644 index 0000000000000000000000000000000000000000..c3a2c140bec0814b5a046dfced45342be20a7579 --- /dev/null +++ b/4b284b6bc4seed4/evaluation/rankeval/4b284b6bc4seed4_5.csv @@ -0,0 +1,21 @@ +task,metric,value,err,version +anli_r1,acc,0.352,0.015110404505648677,0 +anli_r2,acc,0.343,0.015019206922356953,0 +anli_r3,acc,0.3425,0.013704669762934722,0 +arc_challenge,acc,0.2696245733788396,0.01296804068686915,0 +arc_challenge,acc_norm,0.2986348122866894,0.013374078615068756,0 +arc_easy,acc,0.5913299663299664,0.010087174498762883,0 +arc_easy,acc_norm,0.5627104377104377,0.010178768429321595,0 +boolq,acc,0.5825688073394495,0.00862499005021668,1 +cb,acc,0.5357142857142857,0.06724777654937658,1 +cb,f1,0.30043290043290044,,1 +copa,acc,0.76,0.04292346959909282,0 +hellaswag,acc,0.4446325433180641,0.004959094146471523,0 +hellaswag,acc_norm,0.589523999203346,0.004909148239488278,0 +piqa,acc,0.7285092491838956,0.010376251176596135,0 +piqa,acc_norm,0.7399347116430903,0.010234893249061287,0 +rte,acc,0.51985559566787,0.030072723167317177,0 +sciq,acc,0.874,0.010499249222408046,0 +sciq,acc_norm,0.843,0.01151014697923019,0 +storycloze_2016,acc,0.6953500801710315,0.010643426988646806,0 +winogrande,acc,0.56353591160221,0.01393856946567702,0 diff --git a/4b284b6bc4seed4/evaluation/rankeval/4b284b6bc4seed4_5.json b/4b284b6bc4seed4/evaluation/rankeval/4b284b6bc4seed4_5.json new file mode 100644 index 0000000000000000000000000000000000000000..d158d1220dfae02894446ebd5e571a4d0e407b67 --- /dev/null +++ b/4b284b6bc4seed4/evaluation/rankeval/4b284b6bc4seed4_5.json @@ -0,0 +1,87 @@ +{ + "results": { + "anli_r1": { + "acc": 0.352, + "acc_stderr": 0.015110404505648677 + }, + "anli_r2": { + "acc": 0.343, + "acc_stderr": 0.015019206922356953 + }, + "anli_r3": { + "acc": 0.3425, + "acc_stderr": 0.013704669762934722 + }, + "cb": { + "acc": 0.5357142857142857, + "acc_stderr": 0.06724777654937658, + "f1": 0.30043290043290044 + }, + "copa": { + "acc": 0.76, + "acc_stderr": 0.04292346959909282 + }, + "hellaswag": { + "acc": 0.4446325433180641, + "acc_stderr": 0.004959094146471523, + "acc_norm": 0.589523999203346, + "acc_norm_stderr": 0.004909148239488278 + }, + "rte": { + "acc": 0.51985559566787, + "acc_stderr": 0.030072723167317177 + }, + "winogrande": { + "acc": 0.56353591160221, + "acc_stderr": 0.01393856946567702 + }, + "storycloze_2016": { + "acc": 0.6953500801710315, + "acc_stderr": 0.010643426988646806 + }, + "boolq": { + "acc": 0.5825688073394495, + "acc_stderr": 0.00862499005021668 + }, + "arc_easy": { + "acc": 0.5913299663299664, + "acc_stderr": 0.010087174498762883, + "acc_norm": 0.5627104377104377, + "acc_norm_stderr": 0.010178768429321595 + }, + "arc_challenge": { + "acc": 0.2696245733788396, + "acc_stderr": 0.01296804068686915, + "acc_norm": 0.2986348122866894, + "acc_norm_stderr": 0.013374078615068756 + }, + "sciq": { + "acc": 0.874, + "acc_stderr": 0.010499249222408046, + "acc_norm": 0.843, + "acc_norm_stderr": 0.01151014697923019 + }, + "piqa": { + "acc": 0.7285092491838956, + "acc_stderr": 0.010376251176596135, + "acc_norm": 0.7399347116430903, + "acc_norm_stderr": 0.010234893249061287 + } + }, + "versions": { + "anli_r1": 0, + "anli_r2": 0, + "anli_r3": 0, + "cb": 1, + "copa": 0, + "hellaswag": 0, + "rte": 0, + "winogrande": 0, + "storycloze_2016": 0, + "boolq": 1, + "arc_easy": 0, + "arc_challenge": 0, + "sciq": 0, + "piqa": 0 + } +} \ No newline at end of file diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3760dfa9d4ffdbfbee54bc438b751c761304dc2a --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_0_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:793e42dd3f0096a55ba7be52031c94bcc3db60bc61e85edf01f2730ee44c60c7 +size 199058647 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_0_mp_rank_01_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_0_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..09581b15a4ba2adb39d25a4785a82ff956797ea3 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_0_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:461a942d80d3a810551c9e1baf85ffb66eeb76c7b1b26536f915ee7fe088649f +size 199058647 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ca6ac5d9e9979e1efc34ab8adba373741931f905 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_100_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9d3312c2e2cedccd104f497306835de92623db5adc2af5b54e2ec6c8a2e9df06 +size 199058733 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_100_mp_rank_01_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_100_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..68c9e29eb2fc51f3acf36a9145346ccd8b1501d4 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_100_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b5a26c1717fc8b09287eba2246b1788d343004daad7d875cd779432f97296733 +size 199058733 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1dc2a202a1cf78034ca27b72cadc11eb719c820b --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_101_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:51d22643fa98155cc523efad38a8e937d771a243ce1d84a6baf3e793e6f5244e +size 199058797 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_101_mp_rank_01_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_101_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6939a41216130555c5a24eb36ac53320c6739988 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_101_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9004f58bf14b7d8f3a737c0ca8d8cb16aeb040c063fbadc5d514709cda7bf6ce +size 199058797 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e3be9bb43f412f91afb645eacdf7092f7d5c938a --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_102_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ba27cd78cf450699e2ed32cd779e65af136af1634746a18accb692285b00e145 +size 199058733 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_102_mp_rank_01_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_102_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..77068f6222dad6d6b91e2587bdecd85c4b90917a --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_102_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0257b3f05aa45cd29743bc94b8139f9915e2eec3aba021e96607726738520f30 +size 199058733 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4c55b77d864e1bd2f3c1a932b97316fd04550600 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_103_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8838aa16c29e82d2f75cbde50ab693f3bd6b0c9108a313360aa1469db5ea98e4 +size 199058733 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_103_mp_rank_01_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_103_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..36fa689b875d412b46bc70855f165812f7fb5ee3 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_103_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:86093ca2dd5abd48b01cca00915995b6ff50572af6396699a48db73ad3d3f4bd +size 199058733 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..46ee08b84c51d2f42ed7887c98c16935af6d90e3 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_104_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d7938792b872abff7f75b837a2935b4daa54afdd005c6db0f470e89ac6a21838 +size 199058797 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_104_mp_rank_01_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_104_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1055ebf84bbef53039fd4bccb54652ed61d58071 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_104_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:122e392c55d452944f3fe059fb3453e575c9ca48cf7578c1b9659dbc7a148ce9 +size 199058797 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3bb122d1b8edb259c166f2329159ca58bf837223 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_105_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a050a72b105c389255ce99a652ca1fc188a853f360b5210f51a09d5304904383 +size 199058733 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_105_mp_rank_01_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_105_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1e848d57ba2bb64d5a88c5f9392522af371586ea --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_105_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2026fdcd03686933be5083c6695f82421c20b4fd479abfc9646777407edd571c +size 199058733 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5447f4d57305aecfa6374a6696bcffa7bbd29e86 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_106_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ab14c0023784a738496c7889d00b232fa35cebb450c7e3ed1200a12c797d77fb +size 199058669 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_106_mp_rank_01_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_106_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5e2e890cd6fb33bd28f6d923abcc4e1960891624 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_106_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:acccf0975108ce2df2e9c0e1710395c782fef7a7723e5bf274a4f13dcb725f82 +size 199058669 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6e4a5d0769126d8321636ab29252e4afb82e1bf0 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_107_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:39d9a03ac765e18e367c9622ed4e3ea012838dfb9853bb647f9fa04b39da6727 +size 199058797 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_107_mp_rank_01_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_107_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ca06339b670d8c439cd6615b28c00567962fd537 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_107_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:302756b4c913250e3dcce40da1028a2789b9994d107ee0edd20c72fc518926b1 +size 199058797 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8f16ceaaa39b1e7860b524ffc21c14d9af081fce --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_108_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e8519a61c2b049a5a573270d4e17cefa2baa0748c1745506a5a2d9e7ce341433 +size 199058733 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_108_mp_rank_01_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_108_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2e5242b815c203dbc51bde062c228d506f020600 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_108_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6b15fc3f39433dbf4258a1f3f2df826a873635adba3a1fc63cbb0a2b1cdee631 +size 199058733 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0d5047e2c39a5cbf4af07c8cebe9113a3e667a59 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_109_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:25f160630b1141bb64a22abcd484fb1072fbacfc2329da1d09db8877fed0fd48 +size 199058733 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_109_mp_rank_01_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_109_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..da787e963525c7d6ae74ea0e4e3d8b64b5d983f5 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_109_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:87ca737ec9e5475490ff3deaf69fe9e3df51bb9867d8ad34332615603d0c9c25 +size 199058733 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fc03120ba0ccee2b17177f836c18f2ef76fcaad3 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_10_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5875869354d9eefa6fe9b43e385865f9854372355a5467b96b096967227b7501 +size 199058658 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_10_mp_rank_01_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_10_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..154e097fafe4a7dc43f1b67783da28cfa0ea4e05 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_10_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dd607dbb90c8a40c879a193d39bab05f35e80dd73b74d49c383495f611b259c0 +size 199058658 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3b3ada194dad17ec3f38f352870f7b79bc1f196d --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_110_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:218222590cc2c8e942d5264627dd09b6bb0b9acdf5c54339eccab6b82640c20c +size 199058733 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_110_mp_rank_01_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_110_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6ccc11a273b64ff4f007aa852e2b4187b3daec31 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_110_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6551e92f1c7d76934b2c049ae726424fb5feb95b6e310d8a8f2d647183613a89 +size 199058733 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..de384e1e710412607b5d0b577c5751d0b0201860 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_111_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3590b8a107aaad50ea3ecda35e43d20aea72215dbb22baf84e136bdc8d66b27e +size 199058797 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_111_mp_rank_01_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_111_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b86a16ed98e3f520bc3fe6a8dfe1d3220100fa1b --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_111_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dd1ffcd25bc11e3a4a9c2f6f75a21bb2329c32f982e3d87f457b171e76fba6c6 +size 199058797 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..22a1105e9debd4eecb47d4ac7e1d2c87e64cbe27 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_112_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3253a217a352a1048ff9cd4122f9a939c6902b160d892e930c78e7d1e8f7af1d +size 199058605 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_112_mp_rank_01_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_112_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4fb053d89a0a8abf87dc35af32e8b665fc986229 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_112_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3d362041e491e74e7d1b368fdccef6fed273a469dcf774cd2b93dd6cd5993a7b +size 199058605 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..55e74bac684352db3b9ef27778891324370eda7c --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_113_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e78aef9bfe48245b7df686b04bc2752fa9ade22ae46fc57f62fdfd07bd1a33a6 +size 199058669 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_113_mp_rank_01_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_113_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..013ab4be9c0ccb403ec53c3b05adcad62b95ca58 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_113_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:431d846c11287b2ed4bc6483945a083084b9a99e6d44eda07e14f62320b26392 +size 199058669 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..640a6da4f21d2c03343c453751ec280ecf259cac --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_114_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1c8070e7e434474ddc09c37268ae30219425b88cd69f99fe740bc78440918e58 +size 199058797 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_114_mp_rank_01_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_114_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e9e37f61385fe7738e4c72721ae00eab4e7f9b20 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_114_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1722746c141439449ea2798311bb384e886d7b910f58ac028498de4713679259 +size 199058797 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..43f5fde6a2490edc6b1967a2facd3b2399b412b6 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_115_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0dccbd21ac474d977ea933f60ac77c413fdcb80baa7287cf338e350eadf43ab7 +size 199058733 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_115_mp_rank_01_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_115_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..63d021d94675d94f5ce9d8d205a6de3be715aec8 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_115_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:23c0df5a1acd5477155920ec97f902905d75400ef05aa07255630faf08e2c9b3 +size 199058733 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9d8afeb105a36560071ed893b58cfdf93fd1e80a --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_116_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:81e676d97a6b32fda2350e71340923f096b9e25ed1a2c99f2fef9908b8ab1420 +size 199058733 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_116_mp_rank_01_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_116_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c524e91270782df859fed3387e9994905dcca169 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_116_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0769be2f1524d84adce9bee7d4395c4f8940ea4ff41b41f7203472fd0186e838 +size 199058733 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1f05a012679a0806c7d4e62bfcde6261b31f993d --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_117_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e4154fc0676fb3a6765d4243966371440159b41f272994e7b138fc9fe616801c +size 199058733 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_117_mp_rank_01_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_117_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9179cc108c0e3c31bc8ebd8d782d6ce65c1aae54 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_117_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ed3324531549a47d0f1838aff796f66256e4b39996a4c129a7c333a74c6f2f79 +size 199058733 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d7fee63ba4e2c6a935fe36b12488a44f6e7271e5 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_118_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:99e7801131b94dc32ec74a95cc03f1f0bdf190b0614bfa401dc933eb468e1dfc +size 199058797 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_118_mp_rank_01_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_118_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..01711139c65b73a125802c63b99a7740a19b0804 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_118_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0d316967cb19a95a414e7d6cfdd2660b86fda7b382cb558a76ebac13e9d53c4b +size 199058797 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b4b630d4c7407c56d083e6e0afd6262dd6db27ac --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_119_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:98d420cb60c516001cfafd3e4ffdb1d5899bb7252e90221889771d35026426b6 +size 199058669 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_119_mp_rank_01_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_119_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c8e45be0f755eff687ba5853b4c0b858f198827b --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_119_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:27092b9f82fd30e53aeccbb3fcdec7063aa2c31a783ac8316bf627c355e2cdd7 +size 199058669 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..835da8a9b563e061008cbee1f10df9af33b49f30 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_11_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1c8a57055876373c1aa34e26dfdcd11f2ef1aa753c86f4a8cf082e3e565f03ec +size 199058850 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_11_mp_rank_01_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_11_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7a30bcbefde39b21d92447acf258c4067d976a3e --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_11_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b68ac1767635cb8c45041432cb8a1fda9085c9e186f146c4cc0544f18313b753 +size 199058850 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..42b417ec9c89193edbc101c63a212dc4120b8931 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_120_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c0fd3abae936a33d766b498fb73b2dc186b02569b08314c9a02362cd2d9ee605 +size 199058669 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_120_mp_rank_01_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_120_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9f4ba6be8fb22b60d2b20fdbc1ee93db566961ef --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_120_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b8f759a543f7762eef53975909ea8d122cdea8a3cfc233781c5a0212b7025256 +size 199058669 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7bc38ed3dfe1fcc9db2516d6064c92760acec980 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_121_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0b20769d3124ad9bacd87765ecc6c6fbbc3521e06c1f9814b7e3897ead93b17c +size 199058797 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_121_mp_rank_01_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_121_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c85ccb0a66437eaa0cb5ee47781652d238412138 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_121_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d270aecc352a01e5fed03d4c6636b6a4bd6b8bedec390ec3094cc1cff07304e7 +size 199058797 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b1d5b68b884cf416eaa36ffb489191d4b8a57a3d --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_122_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f35eb9cec74b34dc4acffa8c456b1670f501436a4ef87bf1553b9f7a686fd279 +size 199058733 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_122_mp_rank_01_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_122_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ee0ef747ee6d417013353d39c0d07bf97a35489d --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_122_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b8b2c8ea9782a863ad6a4e889f02a858c5d259178e030a8596ce40eca1736e97 +size 199058733 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4062b7bb318269d8cb46e0df48e4e282e56b9e28 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_123_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9f5ef4e3ca0c1add0763984fc0638e8c2e114093bef4980bd47080f1a16af982 +size 199058733 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_123_mp_rank_01_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_123_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2902ee281b2a2f48032b72f7fb0e550b38684777 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_123_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e3284b824e71e8bb80983659715e1b18cad61ea3984d83527d03ec34df131ec +size 199058733 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..87cfd83fd0c1ad14404120142da7ad646ba44f90 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_124_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5ea2ce28e4f38b3ee23d066d1c44a0a3576a068d1d5e1233d5b65d3804c92ee7 +size 199058669 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_124_mp_rank_01_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_124_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f1f474601e2f777479340720be3cf224548e471b --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_124_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d306d768bc7a3712c8dfce986f26844c7ae8eb8b68736376a300c37f44c82fe9 +size 199058669 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b5d9be0e84b25f15960c243a137f5e227ca5f387 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_125_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6fcbfc64237bdb32c102dfd32680e755c0d7e83cfafa921422fa1f39fbe6615d +size 199058925 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_125_mp_rank_01_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_125_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c8160af2993228a156943e3aa6259846397963b7 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_125_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:11e96707a72734547265cd1c7d705ea149b6b724f6672e174050d130172229bb +size 199058925 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1575315628108e3c9eb238bb5f8dc80b4f813cf1 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_126_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ea9af3a25b7d3385b38288c9dddce5417604edf8a19088f61a9c67306e3884d8 +size 199058605 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_126_mp_rank_01_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_126_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e7ebefe6114d60f76cce021c6a17e5e1c4efe663 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_126_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3ef178b0db66848c1fe31968f76f06b0f7dcf695dd105fe63eeb729d3a04e02a +size 199058605 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4d44462e8ce61daed0c57b532486a48508839b52 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_127_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a9722683ae2980cf3806d016d21534a30ddbf33149b63af763281f0be2d66def +size 199058605 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_127_mp_rank_01_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_127_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5efc86308229dff4ea739cc724f1b327c28ecfbd --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_127_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:25e223f223bef51e996c583e266292084caacf5aa2a163cdeb60cc98b1d1497e +size 199058605 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bec41ffd74cf732e734ecb5e634dbaf75f12650a --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_12_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1f84ec255eca817f1c7e10c1ddc2a54a70d31de46739325ac57130f8c6050180 +size 199058722 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_12_mp_rank_01_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_12_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a7223c2d49542e7d7b98aceacc6102b7a1d83747 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_12_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2aa4bf4eef63f9935413e072c30df3c679266d5c6e7323a9ec0b64f4edb3ffe7 +size 199058722 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4559a5e9d0acb5fa874b1aa67e4a7c4d9e928f83 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_13_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a5403ba3e5837538b4741c2aa82e8ecf6201843a2eed504a49612b7617b3a187 +size 199058658 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_13_mp_rank_01_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_13_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3714d9f0ff8b61c45aae6af4faf7818345c02440 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_13_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:01c4dd4fcf98b87defad7afe7557be84f8cac2c2c18d318a12240548cb6afbc9 +size 199058658 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8a045408e71dca6ed98112a7d5d255cf5c7b0756 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_14_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d088a8ec815e0648d58b64de7b583db71a1f40cf3506d4fead32ef00c0ca8af1 +size 199058722 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_14_mp_rank_01_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_14_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d9e57d7f110ca8b7f0491d07772474246875e6b3 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_14_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:495cad650565820b7fca2e8c8423720d7b817084a23ac0749314d21aab7c220a +size 199058722 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0a357fc4c495358842fd2119f4776664877b175b --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_15_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5a13ca9dff967eeb4c2a94dbad7970110d0a47375967e9a23c580ee54e3ccdfd +size 199058658 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_15_mp_rank_01_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_15_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d4324bdae42179cce288abb7ff62ef9e2ef90512 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_15_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e0980b79103314f7a76909deb794cbcd2f3dcfc7abf9af3441bb582614fef9a +size 199058658 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..58e2fce21ff94c9ab5eeb96fb1a534585fba51df --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_16_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4fba27d7606c14ad77797dbd16935c74a8f0d3f4847bcdb463644a0bee56b72a +size 199058786 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_16_mp_rank_01_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_16_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..021a604066b581da3c39d5a59ed89415fbd01d2b --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_16_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:78d8470b9be2aaf52347c42e30f267d28c422ba7d55d91f9b839284373f8654a +size 199058786 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e337bb930853ce6abc88a50dcaf169180729c05f --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_17_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0da6fbb794cac9e11196b2da87144ebd8e2a66413aa8e243614c9ba0428debf7 +size 199058658 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_17_mp_rank_01_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_17_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e275d4d08ba8e772b63f96bfc84e828bb0dab922 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_17_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9eb2b6a97eeb202db7374abba70a6deec9d089680b38e12c71f0ae9b6611d12d +size 199058658 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..088ac22d0274fdc54c8aeba5d927e04a9afd5943 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_18_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:728e9f8f790dbe54790569ef98c855803ac897ec33ec843d5325d70c171e705f +size 199058978 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_18_mp_rank_01_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_18_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..196e9ad74234916ca6c077c943766c6c6952e019 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_18_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9354fdded00a8337f5a986af2655a650b43440037893b17ef69b13c5ffd92a51 +size 199058978 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a4d1ecabd6d08b815abbf14344b584af1e04d972 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_19_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b80314df0482d49bbdf16ac73fbc51b787adb49f0775bad881474dc35c9c14c7 +size 199058658 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_19_mp_rank_01_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_19_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ef61accb8608f320b778bbd75e8ff8a590b54525 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_19_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:006ffb6c8847a1c9f30b98cd9e8259c99577ee2527313e0f541be011c9879af8 +size 199058658 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1db1594c0638f60af6323fc080af8ab8fd6792e0 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_1_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3dbffcec17f80b427d4db76f0e914397ddc857d2dbfdb1773cb9c5ce79cb7f2f +size 199058647 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_1_mp_rank_01_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_1_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..67067fd98f1d3edffc5fe139d7318a6208dad2a2 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_1_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f4ad420148dc9a50308cc771d6a2a9ec531aa6174cdb761339152b2d1b9179e9 +size 199058647 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f1214c68870d04fc53208055564984caba8835b8 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_20_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6020482236ef1f32b20843e51752a74e1433b04a75b7af136b5f8f8d2a8f7d0d +size 199058658 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_20_mp_rank_01_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_20_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4d323e190b87fe330d11c34058d630ca72bc2ba5 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_20_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2106ed17f88715a0c45e270991da26acbc36403805b08ff4b5622e4fd794c2dc +size 199058658 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..94d26460080c4f3de7fca434139aa478f1c7665e --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_21_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:43f218d24e9739db497639820eab00ddf94caf35d73b3b72ba6efcf51c34b9c2 +size 199058722 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_21_mp_rank_01_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_21_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8980e3ef62e87b72e76367709c0cb28720ba0cbc --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_21_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:49768a61cab974a9dc85a0d7ccaed35fe28dd9060eca788e898322efd65d47a9 +size 199058722 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f0ddc893c5993152b7d29f59b02f874fb8987d35 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_22_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2efaec3f9bc60c81342726be44ac0681e6499ca34e7cba0ee8afb6211ffc0bbe +size 199058658 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_22_mp_rank_01_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_22_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..189bfa0727140ce6425ef7dd7a13442c1b38b927 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_22_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b1393268916aa629d05c1f786b03bef9b941585b172a2ddac8b2706438549db4 +size 199058658 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a4f66987fab991739c5af81e108a93bdc160b69e --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_23_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:15d49eef91b06fc0dfcc167ad15c5c2ec38a7b4774df538bf35c6c39fc14882e +size 199058786 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_23_mp_rank_01_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_23_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fbbef9a301d5dc988015c60b9f7ee944698f4d03 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_23_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:99e9617747159026a22132745f1edbcd3ce97afe6bd7230fa48b7e5368902063 +size 199058786 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..196bbbc82f53bae08596a0014cf7ad81b63cfe76 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_24_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6defde84536caada7d7863ccbd97d12be07b50d76457d0f7f9516bb63600ce6a +size 199058722 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_24_mp_rank_01_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_24_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..aa47b6efd60aef033edc42fbfe1146ecbbf2dca6 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_24_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:74b90a38095e01bfd80457ec840be0f32e4adcfee1174a846cf570c2084322c4 +size 199058722 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..32dac4ce70fe01980cd4dba051cadbd712b2586c --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_25_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4ceb21f7a0337f9ac2ee909ebf194017bd481476628439445e9a943dfa8f2f56 +size 199058850 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_25_mp_rank_01_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_25_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0914786b24cd520b234338cf846db0c3e00655a9 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_25_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:acd8bc66770b6e1d1499cabb8248b2c8c0e67a53bf05b208ab53f3bb2d44082b +size 199058850 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cbf4038e8fbaf022c7dfbcc6438ce8e23c7d30ee --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_26_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:584fea98f9472271629fbedf489c7ba2c411529519d686c998652a792393f6e5 +size 199058722 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_26_mp_rank_01_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_26_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f0ef7f6a1152cb34af149751339f93b37879e017 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_26_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1db5e7096dc44a3762e5e48911b4b5fe6185980d5a374cac73dec279d7fccd97 +size 199058722 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0bd676a7b4f4400ea9b74a60bcc684998734f558 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_27_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f3bcd0270c9f050d268c714b4fcfcae31eafe75c4b5da5ea34fe87f7ac368217 +size 199058722 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_27_mp_rank_01_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_27_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c9e90ad6f705571f05c0b87ac8cc066b254d789d --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_27_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:42190522d0683c0d77f26e86eea8175dc223e24d0372db5cab73cf83eb38fd33 +size 199058722 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3f8c3a45035911cc885c366010b85961b495e9d8 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_28_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:44b4d052dfa6524dd9f967e79903131eab9e3fcd25c868246e748cd541020dd0 +size 199058594 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_28_mp_rank_01_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_28_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..56d38d779b51c5730257dec0a64e5e84a68d9292 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_28_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0c6df56cbd3898e2b19357c1ad4869a8b9510cb588627c93abd6d8ccc3bc4087 +size 199058594 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cfcbd0666a7d4645a636100929e73895c8f4a4c7 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_29_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7cbdea148abb850bbfdb365fb6a2822c1a1862d0026e3dba5740b86fba2d433f +size 199058786 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_29_mp_rank_01_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_29_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d1610bbf2db0e23e14c54e99a92a627a54d670a3 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_29_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:53504a9a9d70a16c4238831c978dccee7c36a3b20df65a1b764ea18df4e17bd1 +size 199058786 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..43c3cb8d904297e7ef808cb65f7fdfd6699a50ed --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_2_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cc9edfb37e8ba7c810eaa6db80a6b012d883755b79d4080ec1a8030830f29a00 +size 199058711 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_2_mp_rank_01_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_2_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..94f9694eeb2aa997a10148b681f303164a4f8838 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_2_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2051225bd228d9d7b4f4b2d691482d6de879d70742da5584b5502c8ca38293b5 +size 199058711 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7a5b4720b775f3e12b530c59c8fd115d21491355 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_30_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7fdf936fa28286737d0796fa7a4cc59b0f262f1e21e97ddea9851c935d1884cc +size 199058722 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_30_mp_rank_01_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_30_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e1b184c0bbc85bde7325187baac8335cedc94e08 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_30_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1d51e6616e8d4da4833e9c796d603ea20751bf83b011d3968c94b46b958d8db2 +size 199058722 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9f615c8ab9e52bd319dd877d0a127fb3b27213dd --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_31_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8db31680247d6416fee7381d200f76ff8d58b13c363a6da7c21b1f8da6347016 +size 199058722 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_31_mp_rank_01_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_31_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bc412c60125c97aa1c5f9816dd75f262d78b42af --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_31_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5d90682ba83419c22f017f394f5bac98e57dec148cdfcced387a6bd56f7d94d3 +size 199058722 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..16f8d2af407ff9561452bc000b5756efab766a5a --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_32_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b520ee2e589f696deb7c5aad700aae0f168e10da751d273d926a78eaae9d5d68 +size 199058722 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_32_mp_rank_01_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_32_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ed9e13fdcf6c1199ab2df45aa7e3fa5a63b1e286 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_32_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:47f9665a297b6dd816a87eee371c382c40f8064ead453f1890e52bda0065d0bc +size 199058722 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1ab5ad47660643549de0154b8e9e98ff42437517 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_33_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0bb13ae223fc5ad8a0ad9272c89e19f023cd8fe18041b3e4dceb00320eda0a26 +size 199058722 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_33_mp_rank_01_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_33_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..93ae9b6da4d63fab531c5449fb05979459215dca --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_33_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:26ad20ed89981ed475d5eb4e107f8f6b7b05e1b6930839ac5778f901492645a1 +size 199058722 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d36eac33e8a6410d509c6bde69098b994b7f8430 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_34_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:98220b6d9641085fbb744a36c04ae4dd6f8e147f528480e48163d1c8a6af4520 +size 199058722 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_34_mp_rank_01_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_34_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..21b85262653025c8b736d5ca31b43eef0c32f875 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_34_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:131cc19ef47847b70c8f6f5ddf3d52310e7c564491027e06efda641029afb9db +size 199058722 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9f82ec8cfa20ed9599a34dcd97629e6be176d770 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_35_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3c0c728d4497ae89f3fc2a7ec7eb5db6a2dca3c46301d73c94adeb72e15175bd +size 199058594 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_35_mp_rank_01_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_35_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d2000bf9d129633cc404e7e291cedd67e9246047 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_35_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3e0aed18787d3fa6d75e371eee88886f89712ff9cbbd13bf2925fa391a2d63ac +size 199058594 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5ce8fb192a0e059d8f7035e1ca50668e3060f08f --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_36_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0f90973322c3c84a69735132b0fc5858364fd9dfe15c72f2f12d12a53d003f3c +size 199058722 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_36_mp_rank_01_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_36_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..80a43cd459389b18441ba5a113e0e98bbc62fdb5 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_36_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3862e1e1b21596b40a84b9b90d38b05c09ea19055b1a18426751c9d0df6e00e6 +size 199058722 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..494aa8d7ef7e4551424b39ab068f2bd4dd84f56e --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_37_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eb78e1f9b158acf187b64b2e9026faeac5cf9e2193c2cfa78a1f13b8d8b985da +size 199058786 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_37_mp_rank_01_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_37_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7de6d818d0bd1ce2ec30a985fe9e7600af88236e --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_37_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c9d4985e1454133cd1d67c912cdcce129899bd298f5562bfe1f93abac7373f18 +size 199058786 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..99368b50fa4213e6847026f09f740681da2b2ce0 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_38_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a74987639964aef9b5cffc8ad0796cf54271557884ed13dc0f5f79068aaed759 +size 199058850 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_38_mp_rank_01_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_38_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..33b9b915915a306f8494094c2ede0f44fed39f11 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_38_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9012a3be9c66d9cf11485c50d0c61fa0ca63670474146c638185531c01ec84f2 +size 199058850 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ed55edf6fcc1461a71fe6bdbe6fc9dbc5c69ae46 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_39_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8f7a0d665a127df9e233d291cb8fc83a9c73164f0b2aa29322dea80f1cfe9acc +size 199058658 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_39_mp_rank_01_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_39_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1c37ac1cf2ffaf5032c34ba7f717ea1aca1c8c87 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_39_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:092ed155780c2395987c565f03c2edafac8232a45a64d029a6bec53e62e1cb4c +size 199058658 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1883e08a261986e6427f0abb68377b536e0873b3 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_3_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f52008c26623cbb53dd01fbe817e187a62b4542ffdaa778c22d7f7de79ccee4b +size 199058647 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_3_mp_rank_01_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_3_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7d17ed8a12e4cce658799d92f1facc708d39e8ac --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_3_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fa02b65696081c6c88e803cae6f4fb0190f700db972b6dd4e0242e9faad8dde8 +size 199058647 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..487e95238314094cfec206eba18f9d1ac16c4ef5 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_40_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c967d4fbe4208097d95bc1d652ee4922599948647bbde0879a0e2e41ddc096ab +size 199058722 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_40_mp_rank_01_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_40_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a43ddd3a5e8acbe29e33b90690b78baa024846b2 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_40_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4351025565a72dbdbb68d79e07b3d2377a5fc8a157b347db93732d0ed8aead29 +size 199058722 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..82d4b1d705fda47f53fb7b2ae733a3c07e8dac41 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_41_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:83d0aa518eb48d9e70093082c38f3846890e5f413920c5241d666d3043efbc85 +size 199058658 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_41_mp_rank_01_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_41_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..26fef82ccfdc910e0e2c32a7f00270e9d6e13f09 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_41_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:aa06d03e9fedba5524fcbfe217962c6e07a3bed385498bb92bb11a24a059650f +size 199058658 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d3e911ab1cbad4ef837d44cf6c2ed58bece2da9a --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_42_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7e4c7954687d479c1859d17c44901e094b7a448294ee2e1d03c8fd4fe7128435 +size 199058658 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_42_mp_rank_01_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_42_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9e4a7bb884ae5b3b482df6428755f83b76e759b9 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_42_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:336158ebd4f90ab5f1106864b3e144fa7d0a96180672d82872776b7ce47024a9 +size 199058658 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b80962b40143bd4d231ef2163520825062060500 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_43_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:46fe9559a1daeee48f03e254cc9f48fdc30cde7ef15c698cc0556288375504e8 +size 199058722 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_43_mp_rank_01_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_43_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..dd8f9587ed1ff2cbbd24de77e6d85402e081b1b8 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_43_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2fe2d8165321b7d5b512c34eb7eb47e7857dc90a4c1c131c19879c31c9fe6c9a +size 199058722 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..19a2218db4d3a86893869c3db752d42c6b721843 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_44_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a0ae2ce88d9baf316659f611c3bb2a991058791d7349e3fc4026b7e95ea0908 +size 199058850 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_44_mp_rank_01_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_44_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0bcb2e2305bceffc1982d99437a4e5c0be944fe5 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_44_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e40945c9314dab754e744338671358b70c610821812c274e974bd71178bed123 +size 199058850 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f51d3a31d051c16675e494ba056401b3eec591f5 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_45_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:031bc366b477ae91da7b89279f6c81c9c61d43eaa3c359724983db1fed384fef +size 199058722 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_45_mp_rank_01_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_45_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a08e153161af704c6b6137b42d2c0b7cef9f3ad0 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_45_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d755b200fa9d18bf5a20d3e929a2ddb741f59f0014250fcd48bb02da775bce28 +size 199058722 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7bbb7efe5c871f7e9218aac06f64ec57ff23ea03 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_46_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2b4b581de4120bf13d8189e2b365358957e5e3f7bac09e032aada7bdc6190421 +size 199058658 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_46_mp_rank_01_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_46_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f3f099025cb7a2e8b4a3d0123555f857e1b321a1 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_46_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:86210fa1d21a662c7be12567ea24944254c66bdc1c57db465578b960e42de87e +size 199058658 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..45d7787c7dbf9be77a184b6479a41deaf743d8bb --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_47_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d58319d413ad3cfcea899b3ebcca1e84150517f30f641b0a827f5b19418ea3d3 +size 199058722 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_47_mp_rank_01_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_47_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..58dc5a5c9d5ecffb0afb9d4c799bcfb272460807 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_47_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:de1b4f27225be8943e80d2f51a433b167f22a11333552b20c715818e0e754f0e +size 199058722 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a707ad92ec9037987aa63c7a599c8e07b54fc982 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_48_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b53f56ce3cc3e7ddb7e867847d0dd868308ecd23549f2d77e0364cf10e3686a8 +size 199058658 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_48_mp_rank_01_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_48_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6075ff34551ba69a445294eeabf8b60a04897578 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_48_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d033b1f4ed334042ba924fbbf0fd93b03c534991183c82a3f9eecd808d0b8fec +size 199058658 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cf52cab93bd44ae85c4965f7e54d6bd728fbbf37 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_49_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:25608a9d09044bce7669afc1016d79bbc160bfdb6249eb605b8586c962101edf +size 199058658 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_49_mp_rank_01_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_49_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..317cfd9daa0c78228aea499e1589f1c697c77e70 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_49_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:338fca4db90c081de19ff80980440817117fd41170736e70c91d89ab1c022d2c +size 199058658 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..09f3e3a4f172c8d6202d075f0bd655f28c025bab --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_4_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cd78c1dd8b823606dab1233e49f06ea7bc871ae41c752abf61176cc4d49bcccb +size 199058775 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_4_mp_rank_01_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_4_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..51a16657470becd3698c3590204e0039fc77a037 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_4_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ceb1225c13a96893069e26419ab61dd3029ca607e550cbd29bfb22a83291036d +size 199058775 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4d6a794eb2d5a83d7eb2b47428c1f545e4c61dc6 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_50_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b1b22cee68827de84653d43514490350a3bdc835aeb62dba46d3b98bf8a8c04d +size 199058722 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_50_mp_rank_01_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_50_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6320c37648f05f161a9abd93a0afb584da583282 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_50_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b806ae3e49b41ac8e9a38b9a89be9abfc6fb7060fc16b62fa2624bf884b16540 +size 199058722 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..35703ac1d5c7387bba72054ecdbfec1755ea7355 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_51_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:763ee866f7d04ea48c186cf772e491375ae20373afad4bf66aaf9d5c17e872a4 +size 199058850 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_51_mp_rank_01_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_51_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5a690bf44f0815bcfc36d34a70f7f20e2c936bd6 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_51_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d3a585139fe326079a635961e8f5662ec0120c79fecbeb993eff3bcd547542d6 +size 199058850 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c94d894ef48fa68b0c52d7c63bfae29fde1712d9 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_52_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:84cd7f8490d8b3a44cd8748b9ae1b07e56d4b529ad90dd0ec4dd1d95e440fa8d +size 199058722 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_52_mp_rank_01_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_52_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d71bc233bfedca34b86d21d2b9c95af695888a9e --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_52_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:69b4bc7faf169d8edd7f58721b42c2920fca1e7252feb82c268dd90692ec31ee +size 199058722 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2874e60e0f4d2b5a722138f75def11f2f3c514cb --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_53_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:54b06d6a440cdf4a5c215330850ebe7f84303ed4a420d176d6f33de54efc2f74 +size 199058722 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_53_mp_rank_01_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_53_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5208136f4ed2974f1afd9085726f3f1bcffe9611 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_53_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:12d39b4567f8d87f05375d8b8a7800cc61340cfa4689c8e983c88180a2ab3043 +size 199058722 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5932e4f5c2a9b413661c7fcebb1a38da7b6e8d27 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_54_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b5915680d8c268cb24ad8ed5c19272c668b261f4be0e037b000d24974a61397c +size 199058722 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_54_mp_rank_01_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_54_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f047d39d82b77b78c8c28028ecac25375d409ea0 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_54_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:47b5e667292d0679addcb663fbce6ef014aa68550f9b3339c48ae7cd100189fa +size 199058722 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bf76a9223fac1b4552e1bd27fbdb961e91b0a58c --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_55_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2fd0c687db1323f627184a5d17deec9e1268e91d7369e3d8af7ee5a29b0d98f7 +size 199058658 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_55_mp_rank_01_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_55_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ec80dcfc26e6199f13acaa9d77b6cc6e40b2169b --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_55_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3ec8d4295bb9a5ed67a0ad4730311e85dd606fa7693cd35ecbf013abd887fc79 +size 199058658 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9d32896a906da48917190c9f1d50b0597b8945c2 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_56_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9cce866df49a3a1c5b029a0b55b97eeb9250a04b8a7097cf2992a5a8995a3600 +size 199058722 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_56_mp_rank_01_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_56_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..427e1ec555c18b9bdb5b5c696cbca6ccfd4ba36e --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_56_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:927c19382bb09162175c09549085c249c5499a2abeb5e112ccc94ec3a29cfd4b +size 199058722 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2029447da5eb79707e4caa649f6ed78dde405c67 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_57_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d8bb4da0d653f2b69588105922226cbd1a1ac79b9c982c32d791a2afa880d791 +size 199058658 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_57_mp_rank_01_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_57_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0fb9def1e8224db3f40f3b14ab9b8988b16ced37 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_57_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fafa9055a2b88180e5e63937e4b239f0c6f10cd28fd1ae378b4fb88bb05fa66e +size 199058658 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..373f1806f69caa17c2e925186dc53486eb7ae714 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_58_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a6ea3517a169f952741b036270732abe5bcd46d412f1f571acb54c415d60f517 +size 199058914 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_58_mp_rank_01_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_58_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1825c38e7deefc76f72ba8d8d050a1625c442021 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_58_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c6de82f66d3990a4fba32485f5659ec9890063ad0864557947d6d4d34e39162f +size 199058914 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5179620883925993d268e5cabd978127cc8be742 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_59_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6a55317a76f201c42222802f6cec1d88bbc0cd0841dc97903027f6cf78fe2fec +size 199058658 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_59_mp_rank_01_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_59_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..62e5e0fd01994f06706212be3e079e45bc2d6c4a --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_59_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:758c42fac9db2bf6e2b629dd2c4ffb6205c8697a1ef9a028aa6dd604ce56d99a +size 199058658 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3f940378aff8c980211160b5600dfad64b64bd57 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_5_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:552069ea9d0320634e2842c7b74241478b7566c6810d848470aebd4ccf8c9294 +size 199058711 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_5_mp_rank_01_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_5_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f62b98903c9f75d66f4fcf21a823483d2b3f77f2 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_5_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e7edee3a8531c9798d5152a68e79fa29c50bf43f0bf930ba7bd95b16fedb8650 +size 199058711 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..005f55869f9e2a910ef3630485f25a07540b7dc1 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_60_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:07e445f9927571da01514834c175e31ebad900823777619b36d92ddffadb53f5 +size 199058722 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_60_mp_rank_01_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_60_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9c0264ea666c13398b5bb6483961ee56fcadafb2 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_60_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f42462d3ebdc12914a1885b3324b3390be325c0b05891380f96cc7eb443e37bd +size 199058722 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9914a2541f1f679e399f55dd2dd93da211f51809 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_61_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ecdc9ac61e4fe9f84c097097f06a763aae961b3a598d3236705276719af4ca36 +size 199058722 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_61_mp_rank_01_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_61_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..624209e18264770572243cc0494cef657fc7b6bd --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_61_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ca4da2439172d4517c1341159124c2ad466d225ac2b1c34773453d1338aa784b +size 199058722 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f18d0e15e9acaba3f0187e05162eef7ba820d9a3 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_62_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8dd0a3a98e9657ecb91f52d3b8f5aaba712a3c7f59c79cd6ce059aa74e0ceaf0 +size 199058722 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_62_mp_rank_01_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_62_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b80305d25210dec149962407ac45a092f39ab7a1 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_62_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8ea9ec95cd1f3fcf024e095f0cea28aad3b2b9d5ff0aa42e90c6fb5b6d25313f +size 199058722 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4ebde891afcfca83a32da46d1ec55dff894e5afd --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_63_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0bd9b10edbcc035dfaf3c7e67791d61f3b59ee310d34eddd0475f8ff31e1d7d8 +size 199058658 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_63_mp_rank_01_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_63_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..978b778c231f89f3226ade1d943e7df0c00cb394 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_63_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1375444bd4b8141607823628a8de2a84f800c84972c46db02fc9d00fffa8a850 +size 199058658 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5bfcfeffcb44d1a2b84f9d7a10cb508b3ff0e172 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_64_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:910439a883a653df488d0fa0522c3c88c12eee62481f879811024b0533fc539d +size 199058658 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_64_mp_rank_01_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_64_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7ba1c3d215761bf6cd568e859a62bd21efce2b1d --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_64_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f82fba09bc69490fdd30e0182b63a0d93ec36adcfceb7fc3787aa3e8cc9c7879 +size 199058658 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..415c2cec2ca624dbb4be35dd6cf962d0707553bb --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_65_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c3be15c1f6d574b53a3b6a39e23d53928fc41a8473438d125621715d97e9b5e9 +size 199058850 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_65_mp_rank_01_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_65_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..355e2fd52bccde0d98e83a7d82f8d8d320737a7e --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_65_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:92c2163a258b12b294817d63fe4cb3a88804640c46fdbf19b8dc667e8406aa17 +size 199058850 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d3660d34a309d624e2067cb83ab83adbbcb9b243 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_66_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:571e50b5cdc9efa0040c5908f8759b208fdfa50c1dc98f89f514b9da380e53d8 +size 199058722 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_66_mp_rank_01_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_66_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5131748498fb2b258d03c26b808151cf09a39610 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_66_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bdfb808f7817da7f8470af26567b6ac1386a3ff883822d2409c503212746cade +size 199058722 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..845364bd413b8d2fc479bd516bf014e53f3a978e --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_67_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8405e4133cdbc230141f156103e0086391b71669438372d312387bbeb5c216e6 +size 199058786 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_67_mp_rank_01_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_67_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..83cdf4478966fd169b9c6b969a6a1938dafa4f3b --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_67_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0142e0cac029a07e70d7e388b3e25d2064bbe108500ab8a148ff97a225958f66 +size 199058786 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ba64c29c05e3b5004cc2257483d6f0ccefb64109 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_68_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b6e00e48f7836c2bd741d5e6c259f287d4eb4498bd5b8dfe8f3096a97435ccb3 +size 199058658 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_68_mp_rank_01_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_68_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d1b97064a3352da4d77de9584303b1633616ab9a --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_68_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d62ed210fe20c195d144d52c7e20ee28f6f6e4cf6868a49aa396b9fe24fa6ca4 +size 199058658 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5149f02b913fba9fbc13c790920f7ac647d03783 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_69_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:106f33da0c3e55a0e8e78c5d13963aa19be85a2637f7a93b9718865bed41b160 +size 199058722 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_69_mp_rank_01_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_69_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e33b90e6bced4246b59a7d6b3541eb6eb0ca4786 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_69_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7d5c08de7560552328d7fe5b51870b8a40ab50b63efb0ce229da2f81e244d98b +size 199058722 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c66c70806f493f716d16d8f66517a78c00872851 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_6_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:980c6beb76ccd05039e01589791f8be548d189233546da8e0225eb7fe05eed99 +size 199058647 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_6_mp_rank_01_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_6_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0227c7829e18434cf184e95042d8ac28e6ce478b --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_6_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b63bcf5e93c38f9e16ce27c4f5150a9cc32d022f44c46e19b1c7b37fbcad4d8f +size 199058647 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..06a6ace24fff0850cc806b13a62fe22fa1fc02a3 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_70_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:81f9e787f3d08b98de5971e981015e8c9baa44f85f88183099d5891db594d949 +size 199058658 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_70_mp_rank_01_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_70_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3f931c4a326fda4979605d49ae77837b25233ea9 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_70_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5ffa43f4b2d58f99dd3e69c5f69b6cf621c069707c4fadd61176bfe744e8b5d8 +size 199058658 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f0e10c5cdf90fa51036cd503d87438fce9462959 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_71_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:63d39b162ae9e99f1e4860a174573a21e36aeffd3331ccca7b665629e3420301 +size 199058722 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_71_mp_rank_01_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_71_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..92e2407e6525724f0377ad6cfda36c4ad0e4ad29 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_71_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e4ce349407478cfe0db1549bfd4e93f514aa72d869ed8cded6e2490b612a5b18 +size 199058722 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9d43940b969119838d56b1404312e2433fad308f --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_72_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dcf730899f219bb4d256e33ea89ce99f7881b3a2204205fe5984ff1fbd90a5b3 +size 199058786 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_72_mp_rank_01_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_72_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..54abe85aeea8ac7d52c3f44b9b8766c21f8d7ebb --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_72_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fdce24a7629b132f5aefb7e65b301924e969c4d353b7b986ef6009e5e06de285 +size 199058786 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..23b7aceb38819cf8dd70b5946bee3545a92949a8 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_73_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1b79949508a22c0a063d3fb220f2882d9e15b61bcdedbc10d2cbcc99794075dd +size 199058722 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_73_mp_rank_01_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_73_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..90db14b07009a12175828cb1dc0328e9a80b7d0d --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_73_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:09d170c4fa2163b12a96f98b6453ab874441e82ad20876fbccd72c0db2ce3e8f +size 199058722 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d65da0b7fb40c55a50cac774b90bf67fcd3ceb28 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_74_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d2246d9bb210a2462ad3dafa5fe7be0ba84ce4f64c026f3cf2f88618e9d11152 +size 199058786 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_74_mp_rank_01_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_74_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3b5f4b8aece519ad347ecdaef4b3121201910626 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_74_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5770566e118c676383ceb524d6a29a14df4b1cfa468d37d5870078c009ac8bc6 +size 199058786 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0733cbdeb6c3e00ebb3dac4d4afa3b8382fbdf4f --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_75_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2d859c98bdd4027e72e4863ffacee2510241c6e0e6bb86b9aab2ad16ea512061 +size 199058658 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_75_mp_rank_01_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_75_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5c4f117db96a954f04b1c8257a7667976c88fcc1 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_75_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a2f52b96e146f1098c73bb0df00a15412ddf8dd33b390ccce035be206d96be32 +size 199058658 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..76e7962546023d7642354abaead3c94e29b32e69 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_76_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:556c1e5d2acb53c798d047ea7562728feaa1f2e727032477ea5709e0298dc92b +size 199058786 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_76_mp_rank_01_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_76_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..722f27aac7942de4aff29bc38f1dae9d0463ea4b --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_76_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1a26d2caf4c9d4e0d6d419364a5ba0cc0eef2e27d7290ba5952fa5fc5c2bf831 +size 199058786 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8d2b0355fdd28dd06ca6ebc9456abc30f9f6c4b9 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_77_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:76c5b631f02b750d69308f0ada009368bfe1f3e42c0001a7508743dba812a65b +size 199058658 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_77_mp_rank_01_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_77_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..10be939b195a9c322f49be7833384fa0e3abb0e6 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_77_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7228ae471848dff48362f416b5735db2527bea42a0decc2c9c2ae423cd06b751 +size 199058658 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1f9267ba0a3261ce73caa129d62fd81aa0059f0a --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_78_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eee5f00b19d362dfd206dc2c6809cdb347b7a61a9958b1d411014dda33e851cb +size 199058786 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_78_mp_rank_01_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_78_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bff4dd97163ea7f48ca5721a3bc04687b7835ea5 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_78_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:59f532191fd00c3b3ddb3d07518c9e8318843121dcffb0fc59b55362cbf08080 +size 199058786 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6addcfd45c689bd56be506db6ec336da9c3778b7 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_79_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:529ca4bb06b1e2b84560ec85827235cc67106e6d6eea0640609852d1e6d9dc3a +size 199058786 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_79_mp_rank_01_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_79_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3afca6d6f09951ee06c03bcef0a802a3190e1860 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_79_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b8ed5988aeeabb1a827e713172cb771698dd451e38bdd23756b4fccd10707da +size 199058786 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..60019f9c3fe33f24b38056328ae024ae66924e39 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_7_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:35fc4d294f40c6cc94470d8dd33458ffa53213aa7e735f9f10e557620680d3b5 +size 199058647 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_7_mp_rank_01_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_7_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d95a0f68fa65facfd6b508430667373c1b224a24 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_7_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4761a2ce78ace18749281f8a099c7523bf148501367bbee9c28106b643968a94 +size 199058647 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..853356f030d000fba6dea9689324d278be7b9cf5 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_80_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:153495c2a2ca303fdeba47ad494521865d086d65dd9aacc24ca9150189def9fc +size 199058722 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_80_mp_rank_01_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_80_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..20eed394d94adee53c4199213786709fc7824d1e --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_80_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e683cec49e3be8d0542f41dca8b447ceb45df460dab20d594b1f2923135e0409 +size 199058722 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9a3d10ca2a13af43c36a9f3625c824a6d9062737 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_81_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dca9b74c3aa56c98606f5e37015fb5351dc232a487c1a75a5f5f6e717bda87fd +size 199058722 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_81_mp_rank_01_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_81_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b65820ee990542540db6bb208283d0d59a2c8d8f --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_81_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c520c48d0bf94a4175dd6724a5cecd9baf5e4efcb9a504f0ff5d3a9d2ebd07c4 +size 199058722 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..087d510447f6cbe6819bfca03bcf1515e5b88391 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_82_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ac1df4fee317a9f917ee95fc885077d74807f0700fc1abc7524304143a31559a +size 199058658 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_82_mp_rank_01_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_82_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..31eea0cdff9facba8635b449b90e778a442c6148 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_82_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f79b58677bec6c780d97a02e85503c470b46eaa4bcf130d06a332b03e49de4bb +size 199058658 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4a7b4599ffab5750a7b609c9ffe89f23a79d337f --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_83_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0d1aa0ab54000b72ef1a91abb3deafe33a8ac7981a4f6bc97eaa5c8365337e51 +size 199058786 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_83_mp_rank_01_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_83_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f35676e097c53116053164e3264f2f777ff9aa38 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_83_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a7dc168fbdb9b868580274cd0f653e396b73bd473dbffe897a88831f6823a80a +size 199058786 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0e4e54c7d60ea44642aced7c1da2143e9e321194 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_84_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:52f8dbfc6c9d8d948c0681b9cd24c8f852e19e274fa99da1b1f4ebde48038ca0 +size 199058658 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_84_mp_rank_01_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_84_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a4725f92aa1f4b223d5fab345f60a910bcb0f407 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_84_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0a3968f2f4a019e16dda58a0e73712545becafec437a199ce8f9a0c79d1a3d57 +size 199058658 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a45b55e10a4a7391c73a45eef0188ad99d040d37 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_85_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ccefa604efb98d071d2fb3b591191e838140a49ad015a1ec9e68bf4b51a5244b +size 199058786 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_85_mp_rank_01_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_85_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..72e43e7735f7ec63f35c119c6cbea8a8f05ee68e --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_85_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7349a388a11f5a6338f432ba1d0dc327790a474ee365dd3a5782861ef5a384f2 +size 199058786 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..de3887851fbff516bee9041a35c821847e84ab14 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_86_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4c85e370c3e894b7f9ea5aa2b2e4188f11ed30ab30e605c421c171ed967a7b1c +size 199058786 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_86_mp_rank_01_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_86_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3d6b23f70886b6b4e6d0fbf145ff3d120ecf3f38 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_86_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:830c9d0729b1726a27d9d69a57564daea2046d5d1ca565705f137526f7b1f050 +size 199058786 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cb86a1ff5b5a2f972114d2e139333a0fcadad8da --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_87_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:20adbe3a5fd4dd0c05080de1e52b8de9d65454eaed654919d140b512d178c0b3 +size 199058722 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_87_mp_rank_01_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_87_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0939b4a3b788b1e1e58974e6f3b1690e7c9e005b --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_87_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:061d028e6dbacae1fd3eba51d92cecaba90b0b07ed4b79774b485e65252c1797 +size 199058722 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c1dea508f21c8866fc8ac72bce874112abc70b7a --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_88_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fa699145f9ac5dff49cf5803ca7edb30e9349006ce636b20946fc17e9a968c5e +size 199058658 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_88_mp_rank_01_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_88_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..09269d3afbd6ffb12c4947917cc1574e097dbcfd --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_88_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0305809d9f920a357c9ba5920739a3c5d901dd3733c29fcc365d3cc9ccbeeb1e +size 199058658 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..66605156a3d720435cedbc3e2b6591048ad62f91 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_89_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:491cc2fb2c60cd9c16bb035eaa2906b31dc712e0293c6a9922065c88665e61d5 +size 199058658 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_89_mp_rank_01_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_89_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..29fee8d462dbe5fd25e325bb69048e74a2cb270e --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_89_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5f8f5951161b03fb4945b265b6dbc05c5f9ed6b6ded6986d73a12e4cd210e8d0 +size 199058658 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1740baa4ac266110ba9521c4a6c785daebd651f0 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_8_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d7d003ff7445d6ceac723444cab3fd7f95bd4f22468c72bbdfa62b5fb571da06 +size 199058647 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_8_mp_rank_01_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_8_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bd203fa9c3dd24e68cec15b0480f9ea0aaa17f99 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_8_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3041a0bcaf503433c0e355b05370a4bfc5a62d1bb45ff30748abadae2c14e0ba +size 199058647 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..68ff96ca1ac522c60d1061bdb5d2c846b2cfc849 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_90_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3ab466971a8df0a06d75909e9ec27ecd3860b3555990aaaee48a70f77321031 +size 199058850 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_90_mp_rank_01_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_90_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0af8bc219f0fb634baf1014a776e8fc5ffac0622 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_90_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3089f7c9575655afcbb5ee61bcbf77b82cc7d63da3cdf3175dc6606e0f61dafa +size 199058850 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b336137cf2cc6db7e1657e4c048b68bb3e4c950b --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_91_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2f712b289efcccd1883945a1608aeb9a151a676456bf3c8e1c51e661198b298e +size 199058722 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_91_mp_rank_01_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_91_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a43a352e0f4b7df5c4d34dfe71391a177381b5aa --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_91_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:97449b2fdcfbedd52a482e57f4d1e31c0463902b19077815dcbf7c0efb762ca3 +size 199058722 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4432b9d1d34bc9396b82a9ba39aff9fa29ace89a --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_92_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a949ec01b85ba6898bb390d653eba34cf5c13b3ed2e173a706d64def90ee80c8 +size 199058658 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_92_mp_rank_01_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_92_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..45dac42001129f0c969a8e19aecad4b72a5af190 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_92_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f90e271c2c2357f69c154641119e72fec7cd233a08e8391168423d1fdba5e77f +size 199058658 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..29d275ad2ef31b38b3b420eb5cf9ce2a7bec064b --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_93_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ebae253ae3aea7f324f0e0e884c9096d1c90d7a0ae8ea0044a32e3920af7b33e +size 199058786 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_93_mp_rank_01_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_93_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6cd0931538440feda9f11ddb3aaf68bda01a643c --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_93_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9d137d67299e974a0c1b0a6ceebc36571be3ad9585afffa6ddcbd1f2ad3f2123 +size 199058786 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fda78b113d67160c9506b11548579af11d51b12a --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_94_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:06e5451655a3f281e88e9edc6edd4224319b8befd93702d20fd78b578ad9688e +size 199058722 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_94_mp_rank_01_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_94_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2bb3d6a4e09446656d1045e4c5c91ddac84134e7 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_94_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:07d5f9fb6546c606e65a85573c966ae84d31b4bf3300bea6aaffedc32f82bf91 +size 199058722 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f5f3b04404e53f67cf37520f19c3ad16b7b9b105 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_95_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f03ac01852bc468e39bfbf5935f0cf137e54b7b655dcb690c4e0147b4690b408 +size 199058722 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_95_mp_rank_01_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_95_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..7d8bdc7ba583e1021b7408e6012b39108e911f1a --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_95_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cb27d96969e6eb7d1ad1aabbbaf2e13afd9d2cb42e409cab88b9da6783bbbf35 +size 199058722 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..41209eebe3489ba8232ffabaec87a65c2402cc9f --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_96_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:eaf27dceb853a23be38cb93d70178871b7e4628985afe85205ed410b7c3f62e5 +size 199058722 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_96_mp_rank_01_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_96_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c42317ebf2e5ae6948c533cd2b3dfed506e4a733 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_96_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b12020a23083e5858ac06714e7ca5e991601a65dbab4f340f4be8dc0f7f5fcf9 +size 199058722 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3f4a8335fddc113b58f9de450b6562c103bbdcd7 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_97_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ecc352e6bfc648df97829334e20e469650985b2819e1a23b16408b0268c3389b +size 199058786 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_97_mp_rank_01_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_97_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fe595e53d9c3e3cacb4d6d465ab22dbfa95d61f8 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_97_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ac347777f9a63502efb5f800ed8cb6b877b0582518b7bf14bb85de17c7026df8 +size 199058786 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3a913a8ec797dff79d42de1c487fd5fc0c67caab --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_98_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7993ac232bcc9d12e17a306741340279241ed76c64af5c805388d51ae153be79 +size 199058658 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_98_mp_rank_01_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_98_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..18391475d24253d46a6530f6893ba8e3867622dc --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_98_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0a728e180c0d1b41befd80e904653686fb00c538d62d9a3e8eb80a6d9de3f7f1 +size 199058658 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..93a6eff7f0aff289db2b05413a1e96eeaad981d8 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_99_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f86fa43c4861e3268c354aff77c173298e04f4a73fec68453f24f271e401ca59 +size 199058658 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_99_mp_rank_01_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_99_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5b6463f724cbed771b2e89435ce37f59c2e44f44 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_99_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ddd2fb5ef8b4f3c18f7aedb16273ac29b6cd8d435abe078608972138015b8584 +size 199058658 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..18c4c80516e7606c5875a33d54fefe4fd1aa741e --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_9_mp_rank_00_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8a0f346a2449ad5a80161c407b1d0aa1a740776f3bb30a74ec567a9b3c1a7a8a +size 199058839 diff --git a/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_9_mp_rank_01_optim_states.pt b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_9_mp_rank_01_optim_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..aa6d369db06518c9c2bfe6f9a4001ab3027d7562 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/bf16_zero_pp_rank_9_mp_rank_01_optim_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2ebd951a2faeacc2af8d4f7dec785082f4406069cd07efe4b533cb5b18ffe8a5 +size 199058839 diff --git a/4b284b6bc4seed4/global_step80108/layer_01-model_00-model_states.pt b/4b284b6bc4seed4/global_step80108/layer_01-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8ac040c2feb56ccb37c305530cdf74e62671eca2 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/layer_01-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e3228cd9f8deae6b875239ffacdb48e95eabf7604fef2bd572fdf4a19d575553 +size 167511299 diff --git a/4b284b6bc4seed4/global_step80108/layer_01-model_01-model_states.pt b/4b284b6bc4seed4/global_step80108/layer_01-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3c383944fe0393c2c65c78c23bcff66ab1ae8ca9 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/layer_01-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c3cc2a94a3fe66300d21e59b2d2059cb4c7a4e244d8b00401ec9f3efefd46147 +size 167511299 diff --git a/4b284b6bc4seed4/global_step80108/layer_03-model_00-model_states.pt b/4b284b6bc4seed4/global_step80108/layer_03-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..99af33085aa38fcde3ccc00bdddcfd908d6520ea --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/layer_03-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:301991e2f165b4dd63dc8f999597cd6fc4160609f6808057857ac61c068eb776 +size 113308931 diff --git a/4b284b6bc4seed4/global_step80108/layer_03-model_01-model_states.pt b/4b284b6bc4seed4/global_step80108/layer_03-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..448bc3f68de1dccfbd76ecb16a49ff5552341c6d --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/layer_03-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:58aea38aa576ef71186d8be437ff2824087a82ecd4654d0a3417309567bfbbf2 +size 113308931 diff --git a/4b284b6bc4seed4/global_step80108/layer_04-model_00-model_states.pt b/4b284b6bc4seed4/global_step80108/layer_04-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b16b457bfd9f1126c5bff36f6898f974a56fc64d --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/layer_04-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df90de458d2a53639bdd43e4f3dcc1a6d3ab0950983d58b0ad79d87ec38abc93 +size 113308931 diff --git a/4b284b6bc4seed4/global_step80108/layer_04-model_01-model_states.pt b/4b284b6bc4seed4/global_step80108/layer_04-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..81c6a67da58a3322de1c2aceb4e7e97ff2f6794d --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/layer_04-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:556830479411b91c4d851858a3d9bc67d05f1a7fbb678f62d8a6b197b16936ff +size 113308931 diff --git a/4b284b6bc4seed4/global_step80108/layer_05-model_00-model_states.pt b/4b284b6bc4seed4/global_step80108/layer_05-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b30853bc786b8e6bc7aa3312d363c413f04dc575 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/layer_05-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:da918df3984c0941341d0da95e757fc492cea236c449d7ecf2a902aa2d99930e +size 113308931 diff --git a/4b284b6bc4seed4/global_step80108/layer_05-model_01-model_states.pt b/4b284b6bc4seed4/global_step80108/layer_05-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..e8ec3750d04faff884c10b6ad01d6f6ec8390f05 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/layer_05-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d9482a08a342411cdb03905854f0b7ce470614a6ebdde342c35c1a0a87edb56d +size 113308931 diff --git a/4b284b6bc4seed4/global_step80108/layer_06-model_00-model_states.pt b/4b284b6bc4seed4/global_step80108/layer_06-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..29a6700e5ab2c17a3e684a53c7719e74f0a1ce09 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/layer_06-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:93006313ed387571d5f8103e00ce10b0c1b4773f99c3c8a142c46c2c35a9bb1b +size 113308931 diff --git a/4b284b6bc4seed4/global_step80108/layer_06-model_01-model_states.pt b/4b284b6bc4seed4/global_step80108/layer_06-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cd71f1e3021f461d8df8f0feb407900c376d94e5 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/layer_06-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:31333022e6424de6308cf4f24a9a4315c219d71f87f3f03cec660bd225b0af5d +size 113308931 diff --git a/4b284b6bc4seed4/global_step80108/layer_07-model_00-model_states.pt b/4b284b6bc4seed4/global_step80108/layer_07-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..922bfac9aa71a0f1aab36a94ceddf4aa0489002d --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/layer_07-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8939c3ed5736beb2588a716e108e3028a78acaf7237301a99037c8d8a309b723 +size 113308931 diff --git a/4b284b6bc4seed4/global_step80108/layer_07-model_01-model_states.pt b/4b284b6bc4seed4/global_step80108/layer_07-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a19be3646906a76515782628cfc812aa6ab00c2f --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/layer_07-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:81952a7c2a576d166ca48173168022ae4607f13b091ae6f380f5b5821a52c76b +size 113308931 diff --git a/4b284b6bc4seed4/global_step80108/layer_08-model_00-model_states.pt b/4b284b6bc4seed4/global_step80108/layer_08-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..02601761324d1e42633f9342c2b7425be6035014 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/layer_08-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2faf055743c63a0327e338815d142adf92e6aa8ddec20b33f1d5a5f386f35657 +size 113308931 diff --git a/4b284b6bc4seed4/global_step80108/layer_08-model_01-model_states.pt b/4b284b6bc4seed4/global_step80108/layer_08-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..468ef7ee914b4e7893999d7f487ca9a208cbdca6 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/layer_08-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:542ea40c0ee10a957a07c1b50f486bc1f1b81de800c39cb5d85ca19ce53a7eb8 +size 113308931 diff --git a/4b284b6bc4seed4/global_step80108/layer_09-model_00-model_states.pt b/4b284b6bc4seed4/global_step80108/layer_09-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c2677052c8d4774ffaee9efd605c4d0b868855f2 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/layer_09-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:58b581bc34dc67e1f49a7ccaf5b7faa494773da10d367686bd2f3e378ec72107 +size 113308931 diff --git a/4b284b6bc4seed4/global_step80108/layer_09-model_01-model_states.pt b/4b284b6bc4seed4/global_step80108/layer_09-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..cc16339da1034e62f41410a12fc9ea28d6993035 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/layer_09-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:833a835226e07b64e8c5a06cef6d3b127995e77c685b311b731e31fadc055dd7 +size 113308931 diff --git a/4b284b6bc4seed4/global_step80108/layer_10-model_00-model_states.pt b/4b284b6bc4seed4/global_step80108/layer_10-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..23a02770d0b705a4adcd89baad74e9b6497ff3e6 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/layer_10-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:9e1231c64187bc1b0d810b3e6904f7fc52055ad4637e10da615f8d43b9119f08 +size 113308931 diff --git a/4b284b6bc4seed4/global_step80108/layer_10-model_01-model_states.pt b/4b284b6bc4seed4/global_step80108/layer_10-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6d008f220f75d11b600f907ff263a71377d9b57d --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/layer_10-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:37ed8225543b0c20e8b8586ba29849033d7bed3d82ba14ab793b1bf97fe53b7a +size 113308931 diff --git a/4b284b6bc4seed4/global_step80108/layer_11-model_00-model_states.pt b/4b284b6bc4seed4/global_step80108/layer_11-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0fe874f47d499659712a5e5a30da399d3c698658 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/layer_11-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d700bf1fb7d32248f08feba7c9b582dbfea1ac0b82c796fb085ecc09a06c7748 +size 113308931 diff --git a/4b284b6bc4seed4/global_step80108/layer_11-model_01-model_states.pt b/4b284b6bc4seed4/global_step80108/layer_11-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ed85a3876da8ebe043e80a000946f37e9d0025ad --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/layer_11-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a22cdd007c805d8be9e5bc62e733dde2e9a4791302b1449d90b9078e1bc1d519 +size 113308931 diff --git a/4b284b6bc4seed4/global_step80108/layer_12-model_00-model_states.pt b/4b284b6bc4seed4/global_step80108/layer_12-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c4c5acf84ac709924ca767f62cef6fcee8f05f8e --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/layer_12-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5183aa2939ba1064e521dcb7e0fab09e6cfbae04568c678c001d84ad510d93ac +size 113308931 diff --git a/4b284b6bc4seed4/global_step80108/layer_12-model_01-model_states.pt b/4b284b6bc4seed4/global_step80108/layer_12-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3775fec3a15b082e6cf2249894629d64cee09b9a --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/layer_12-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f7ae7d00eb0b684175d80be6990f2bda9a4d2d2ccd4c8410a4f9987b1dba1d69 +size 113308931 diff --git a/4b284b6bc4seed4/global_step80108/layer_13-model_00-model_states.pt b/4b284b6bc4seed4/global_step80108/layer_13-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..41a9e0743d9069d06e81992e9314f6f9ae2a97e0 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/layer_13-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a678855d9980ec56928304760bcee4fa23636f998c7e5dd240af7b786ca0f029 +size 113308931 diff --git a/4b284b6bc4seed4/global_step80108/layer_13-model_01-model_states.pt b/4b284b6bc4seed4/global_step80108/layer_13-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b565bc90c3df7e0cd38b2aa4eae836f94343d5fb --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/layer_13-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:08a610f3d5212eabee648e8738a18412f1b2580060d4c1f4c91f937cdd3b02d5 +size 113308931 diff --git a/4b284b6bc4seed4/global_step80108/layer_14-model_00-model_states.pt b/4b284b6bc4seed4/global_step80108/layer_14-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..16e5767b3d6b28f10031d980a9e34e4cfd7c265c --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/layer_14-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b46d291755643c6007fa603eb8654423b2f33ef42b68a996272ad3a7d5c87ae8 +size 113308931 diff --git a/4b284b6bc4seed4/global_step80108/layer_14-model_01-model_states.pt b/4b284b6bc4seed4/global_step80108/layer_14-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..368a98433cf804c8f610045ded873dec6c2dd2d3 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/layer_14-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:490f9a2d3bb140021e0b340defcead36b008dfd46121bb203a0c04c714df5964 +size 113308931 diff --git a/4b284b6bc4seed4/global_step80108/layer_15-model_00-model_states.pt b/4b284b6bc4seed4/global_step80108/layer_15-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a162fda62b86d44d93da2aef4c0b9c0e68c935f8 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/layer_15-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6a58a2956e4510990358805269cbe2b0d3c23a3d0f7352fbfbf20c6b4fb045ab +size 113308931 diff --git a/4b284b6bc4seed4/global_step80108/layer_15-model_01-model_states.pt b/4b284b6bc4seed4/global_step80108/layer_15-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..664a5106e3963ee77d11f029f47768170528bb83 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/layer_15-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:24450c8570c1793f942c986638f6c6a74c08aa65a6dc08843e72d10c4ec6e539 +size 113308931 diff --git a/4b284b6bc4seed4/global_step80108/layer_16-model_00-model_states.pt b/4b284b6bc4seed4/global_step80108/layer_16-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d31200e0b8036162e6a840c88826d5b3ff00dbec --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/layer_16-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:30d11f0b5842ab67eab3e1863a13801536e9163a2970a65968946ee878e73c91 +size 113308931 diff --git a/4b284b6bc4seed4/global_step80108/layer_16-model_01-model_states.pt b/4b284b6bc4seed4/global_step80108/layer_16-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..bcc26a20ea6b6c8c72f8d8d411068ef163a77e80 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/layer_16-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:697ba5dc341168ca383b8b35849da1be56559877d1136ff33002ebdbf0784bcd +size 113308931 diff --git a/4b284b6bc4seed4/global_step80108/layer_17-model_00-model_states.pt b/4b284b6bc4seed4/global_step80108/layer_17-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..43bc92a0d3f262deaa375afb7b4c6e7ddce86a5f --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/layer_17-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:cc4098c6b7f0698a9ef57e9aae1118b313357339d2a36cfbe9c452ac9159eb62 +size 113308931 diff --git a/4b284b6bc4seed4/global_step80108/layer_17-model_01-model_states.pt b/4b284b6bc4seed4/global_step80108/layer_17-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..40c8f729b5919907714b06b9a7c3377f98eaa3ed --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/layer_17-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e39dfecf7e005f9f275db05e6c306593458c8be81f1a7b2e626debc8230e6006 +size 113308931 diff --git a/4b284b6bc4seed4/global_step80108/layer_18-model_00-model_states.pt b/4b284b6bc4seed4/global_step80108/layer_18-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8ec57ccc47712688e2a532267e4a0c87ab5f0384 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/layer_18-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:df8d43598bf07edfed308cd383265632daa4bff362f47ed8c0168798f6f5355c +size 113308931 diff --git a/4b284b6bc4seed4/global_step80108/layer_18-model_01-model_states.pt b/4b284b6bc4seed4/global_step80108/layer_18-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9395ff94902dc69101608b5e7fe8d2a86391dd18 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/layer_18-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:02394b7e3e29c940da980218ca0d95b8c3e17f19ff2c864512c67d928ea9a02b +size 113308931 diff --git a/4b284b6bc4seed4/global_step80108/layer_19-model_00-model_states.pt b/4b284b6bc4seed4/global_step80108/layer_19-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ff0590cef27764a5290f95a2ea3caaa35c2a83a9 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/layer_19-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8c03f32a50fee7a6f21dac60ab8f77fff59d33f3436261f46cae7a83f4481bb1 +size 113308931 diff --git a/4b284b6bc4seed4/global_step80108/layer_19-model_01-model_states.pt b/4b284b6bc4seed4/global_step80108/layer_19-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..61da5b721b1366da91ed964516ae19abfa3aac66 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/layer_19-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1e5ad9e942b6abfc9e62cf15d0f53a3b5c1f63b4187735c0d91aea582c2cba23 +size 113308931 diff --git a/4b284b6bc4seed4/global_step80108/layer_20-model_00-model_states.pt b/4b284b6bc4seed4/global_step80108/layer_20-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..39bbd9e5a2c7b811645d25ef48fc971edbbb8bbd --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/layer_20-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2ad75fbf5be41b02dbee184adc50b6d8a36b1efea17ca7798ad5a0de5173e846 +size 113308931 diff --git a/4b284b6bc4seed4/global_step80108/layer_20-model_01-model_states.pt b/4b284b6bc4seed4/global_step80108/layer_20-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..9c5e4d4278c4910001654980963d828c40bc5426 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/layer_20-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fb7b05ef94673960436f8ba519f9f54a8827a6bc61ec99e45ec873d1ff464b8c +size 113308931 diff --git a/4b284b6bc4seed4/global_step80108/layer_21-model_00-model_states.pt b/4b284b6bc4seed4/global_step80108/layer_21-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8760c8c48730ecbf0296f95b3ba29d215d3736df --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/layer_21-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:185d8e3600b30228ad8759e54b484b5002cb795ca4bb557843acce2ef0477409 +size 113308931 diff --git a/4b284b6bc4seed4/global_step80108/layer_21-model_01-model_states.pt b/4b284b6bc4seed4/global_step80108/layer_21-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3ad291fc4248cf923fba003cb3bff7ed8992206c --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/layer_21-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:02512d0ab7de4a95dd65fdc1a1ce82ab6d1d8c84cf501993e4f7c19d43fd19f4 +size 113308931 diff --git a/4b284b6bc4seed4/global_step80108/layer_22-model_00-model_states.pt b/4b284b6bc4seed4/global_step80108/layer_22-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2d690484a3b4b1cbda0a69bf6b802b1248714955 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/layer_22-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2c04d63f5e41b0c866baa02256494db87ba0d72a08295b60b93e341bafcb125b +size 113308931 diff --git a/4b284b6bc4seed4/global_step80108/layer_22-model_01-model_states.pt b/4b284b6bc4seed4/global_step80108/layer_22-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..fa8a5d78ace671794901a25f738a178b6e83afcb --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/layer_22-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8f8c30c450b2a924c1cbd655f522cbb78aaeb8ae004f564ca1c128879f65e939 +size 113308931 diff --git a/4b284b6bc4seed4/global_step80108/layer_23-model_00-model_states.pt b/4b284b6bc4seed4/global_step80108/layer_23-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..0e9d5ed6f28495f1b8ed61e7c27af77c6e5b4911 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/layer_23-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0d683cf549eca1bb536a2b2b06e553d731a5c5c349bf1563b93ba2b20f500c12 +size 113308931 diff --git a/4b284b6bc4seed4/global_step80108/layer_23-model_01-model_states.pt b/4b284b6bc4seed4/global_step80108/layer_23-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a809212069892e10a9258d09a096d8cb18b75754 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/layer_23-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5258c50a734ac9490139978a458fc23794f8f0287225decd4fcb36c21e519804 +size 113308931 diff --git a/4b284b6bc4seed4/global_step80108/layer_24-model_00-model_states.pt b/4b284b6bc4seed4/global_step80108/layer_24-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..874380fe62cc9c76f7ee583edfd159ef00fe7ab8 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/layer_24-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:08df9fbe232906b5e4fb988f794a8513906ddc3d2765b20d66822b5d80f7ab91 +size 113308931 diff --git a/4b284b6bc4seed4/global_step80108/layer_24-model_01-model_states.pt b/4b284b6bc4seed4/global_step80108/layer_24-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..12c1ce02f195c62bb87998998c21569a47a52eb0 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/layer_24-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d6e62ebec046d52fa23c2f55295593edc842e21b88788089a08181c90cea59ff +size 113308931 diff --git a/4b284b6bc4seed4/global_step80108/layer_25-model_00-model_states.pt b/4b284b6bc4seed4/global_step80108/layer_25-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c173d5440d396e4b69f906994c16f2b9bf671761 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/layer_25-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:476d32b94def38d5bddceee47eeae2f3cec1c39be7259aae729ba6bb1c0056b6 +size 113308931 diff --git a/4b284b6bc4seed4/global_step80108/layer_25-model_01-model_states.pt b/4b284b6bc4seed4/global_step80108/layer_25-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..647af1a6430e85d5b893061da0bb4a9adfe4016f --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/layer_25-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:bfcd8304d590bacde986e5ff126ca79738384dbe2bff62d08a8a9ea81ddc61d4 +size 113308931 diff --git a/4b284b6bc4seed4/global_step80108/layer_26-model_00-model_states.pt b/4b284b6bc4seed4/global_step80108/layer_26-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ac4e6dcf8b070a481aa94808926309e6a501f185 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/layer_26-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0867da64d7442f52b61a2424c8ce9c2290ea1c6d2746f4ed920d266d782f344c +size 113308931 diff --git a/4b284b6bc4seed4/global_step80108/layer_26-model_01-model_states.pt b/4b284b6bc4seed4/global_step80108/layer_26-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1c7814fac80e792f6ab168cc837a2721d47e6cb5 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/layer_26-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:ed6d9a4aadd9e8c5a1921af39311979338d91824aa9ee5173c23266532111f75 +size 113308931 diff --git a/4b284b6bc4seed4/global_step80108/layer_27-model_00-model_states.pt b/4b284b6bc4seed4/global_step80108/layer_27-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..ee4bb0fd68a08dab6e22c60846c56326b6fefec4 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/layer_27-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:893a3fb745bc9531f435766f53f0a866e2c17705c223491966376557fa34ace1 +size 113308931 diff --git a/4b284b6bc4seed4/global_step80108/layer_27-model_01-model_states.pt b/4b284b6bc4seed4/global_step80108/layer_27-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..5928a064eb0afc04d0e18b78643e7dbef3f6458b --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/layer_27-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d08dbe285e3c70eed8714005eb9d85f780655a320e92bf0be6896e54b655fca5 +size 113308931 diff --git a/4b284b6bc4seed4/global_step80108/layer_28-model_00-model_states.pt b/4b284b6bc4seed4/global_step80108/layer_28-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..129ac21bef77f1e0199b043fdee75e6521f272cb --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/layer_28-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3bb73b34966ded50e3484c127c71553f5d2c02ab8034c8f7408c37e61930bbb1 +size 113308931 diff --git a/4b284b6bc4seed4/global_step80108/layer_28-model_01-model_states.pt b/4b284b6bc4seed4/global_step80108/layer_28-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..1f064fb080cadc3b005f95575a9d716140f84d3f --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/layer_28-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f225de18dcbf9c9a45f5c4930a1885ada784098f9bea3562a8769af661f93d06 +size 113308931 diff --git a/4b284b6bc4seed4/global_step80108/layer_29-model_00-model_states.pt b/4b284b6bc4seed4/global_step80108/layer_29-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..386fa8376930054019ae5d59f61e4c143676637f --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/layer_29-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:4a9dbc04eb26bfc8cae311a42c0be70e9ba39c64ceb4d040b8b641b8cec8044c +size 113308931 diff --git a/4b284b6bc4seed4/global_step80108/layer_29-model_01-model_states.pt b/4b284b6bc4seed4/global_step80108/layer_29-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3dfd24540c74a01bcde60bcdca72f846ffaa513f --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/layer_29-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:fe94010974cd65a3f0c57094c5019e69e27f26d444163f121d73e4cc0dfed614 +size 113308931 diff --git a/4b284b6bc4seed4/global_step80108/layer_30-model_00-model_states.pt b/4b284b6bc4seed4/global_step80108/layer_30-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..3be82afd03b94be58f19f0a04d1ddda33fe3922f --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/layer_30-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:f0adf657d3d8da93144282eab3488bd20e4e9144f15b03bfdccb5fdac8430bfb +size 113308931 diff --git a/4b284b6bc4seed4/global_step80108/layer_30-model_01-model_states.pt b/4b284b6bc4seed4/global_step80108/layer_30-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6e2e74f8dd4e0ae16390fab9d4f034cfe8482ace --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/layer_30-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:22284172001d7860cac10115c2765f822c08b09f44f87e6821afaaabc686fe26 +size 113308931 diff --git a/4b284b6bc4seed4/global_step80108/layer_31-model_00-model_states.pt b/4b284b6bc4seed4/global_step80108/layer_31-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d5dc55b9bdfdac4c35825f1eae3758fb7f0a6857 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/layer_31-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7645ef024d0c858f3e222625f5919dd8d0285cec7e1162aca37b90c90a99a8e6 +size 113308931 diff --git a/4b284b6bc4seed4/global_step80108/layer_31-model_01-model_states.pt b/4b284b6bc4seed4/global_step80108/layer_31-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..b6313f0ca760b8177a89487a291d8e24666094e9 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/layer_31-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:51fb2cc33aa0723463e8e521197da75072177508d97ca35c1d4912c363eb63fa +size 113308931 diff --git a/4b284b6bc4seed4/global_step80108/layer_32-model_00-model_states.pt b/4b284b6bc4seed4/global_step80108/layer_32-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a4119ef979fc1c399be5bebfeaa3eef70cfc2cb5 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/layer_32-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:2ab676edf0a0eff810999e1838dabceff009facf4cfb87002bae38fee0eedfd3 +size 113308931 diff --git a/4b284b6bc4seed4/global_step80108/layer_32-model_01-model_states.pt b/4b284b6bc4seed4/global_step80108/layer_32-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..14f88381e7ddcdfc0f662c2fe5f6aff68e38e763 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/layer_32-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8cf91c29a53078a5cc5a465f3dc742d3c7c49e73cbd305b69750ac0733b71ab1 +size 113308931 diff --git a/4b284b6bc4seed4/global_step80108/layer_33-model_00-model_states.pt b/4b284b6bc4seed4/global_step80108/layer_33-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..afe85cce6890e3149184b7b50b9564e67ea0753c --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/layer_33-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3db5e7d704329c3cef10a77845dce042325eba14b29ce5418f1e4689109b2f75 +size 113308931 diff --git a/4b284b6bc4seed4/global_step80108/layer_33-model_01-model_states.pt b/4b284b6bc4seed4/global_step80108/layer_33-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..4fa81317bc2c6667a41cb8cdd592893bfbba5c4a --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/layer_33-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:b2e7615fc92bceb08fc675ed56cb9e9a4cae9fca91e66eca1e8556d78d7210c5 +size 113308931 diff --git a/4b284b6bc4seed4/global_step80108/layer_34-model_00-model_states.pt b/4b284b6bc4seed4/global_step80108/layer_34-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..49647dd6b97c9ad2ddcb34c1c5ba0975480c448a --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/layer_34-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:3c9b4f03b30fa141f7f2d92eb9a445e46cd2c025fd01f9b276368a593a681427 +size 113308931 diff --git a/4b284b6bc4seed4/global_step80108/layer_34-model_01-model_states.pt b/4b284b6bc4seed4/global_step80108/layer_34-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..f9f90591fd3ac1803fc18a49038f45a4032b72a8 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/layer_34-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:012931d0f302f56e3949ba57180a76a60353bd7233c0ff783f63ab0ccc4c2fa8 +size 113308931 diff --git a/4b284b6bc4seed4/global_step80108/layer_35-model_00-model_states.pt b/4b284b6bc4seed4/global_step80108/layer_35-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..6f61351d5860236937fbda9cd7629b56295e81be --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/layer_35-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:278f38957c05ba1817c25ac141e68b63c467a4519a1dea2309392ab1e3dc1247 +size 113308931 diff --git a/4b284b6bc4seed4/global_step80108/layer_35-model_01-model_states.pt b/4b284b6bc4seed4/global_step80108/layer_35-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..51b9511e4d1e7fc68ff46aa5b4cf77f038b2ab0f --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/layer_35-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d276c4cf7a73dc6b2ba5ad1c5cc64f8a7dd856420f0f81dc24e0ce570d4a64b4 +size 113308931 diff --git a/4b284b6bc4seed4/global_step80108/layer_36-model_00-model_states.pt b/4b284b6bc4seed4/global_step80108/layer_36-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a594ccf8b9a944d2a29d67ab8f5afbca32f7578e --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/layer_36-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8d438036e2f18d30b0d23248680dca497affb646c5fe136645d34b47109f9cd4 +size 113308931 diff --git a/4b284b6bc4seed4/global_step80108/layer_36-model_01-model_states.pt b/4b284b6bc4seed4/global_step80108/layer_36-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..c8b7368f83648672d07787a93794182dd2f37923 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/layer_36-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:95b84c28a54f35be4391fcc79930ec3f558615ebb1c770e31801a95f2d591b54 +size 113308931 diff --git a/4b284b6bc4seed4/global_step80108/layer_37-model_00-model_states.pt b/4b284b6bc4seed4/global_step80108/layer_37-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..90d273290a27c503624a0aa1fcc9fcaba413b763 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/layer_37-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dab9a9479a1f534c9b6ee46ab5142b3cfd41f70a7289ec040cd56ba8b7d3685d +size 113308931 diff --git a/4b284b6bc4seed4/global_step80108/layer_37-model_01-model_states.pt b/4b284b6bc4seed4/global_step80108/layer_37-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..274a3d3d5785f961021cc85d33db0ab3a73e5bdf --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/layer_37-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:c18db94e7a8fcdc61cccd5ed20ddcf9fd5fc2f221673b44763bd57f9f005d9ef +size 113308931 diff --git a/4b284b6bc4seed4/global_step80108/layer_38-model_00-model_states.pt b/4b284b6bc4seed4/global_step80108/layer_38-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d6e75f18df3412f81e1850d713e2cfdd2ffebc08 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/layer_38-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:6e6d20d2786f18361f21b920b63c9ac0698dba8e835e3f7df11f3009917e5877 +size 113308931 diff --git a/4b284b6bc4seed4/global_step80108/layer_38-model_01-model_states.pt b/4b284b6bc4seed4/global_step80108/layer_38-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a26efb0bdc0c5cbe76689953d3286fbbe8f27077 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/layer_38-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:d6f78e07c97a26d34783875da3becb859d9c2f6c72bcacc2aca7d441029da0d3 +size 113308931 diff --git a/4b284b6bc4seed4/global_step80108/layer_40-model_00-model_states.pt b/4b284b6bc4seed4/global_step80108/layer_40-model_00-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..8079375c4a9bf21cbe3c6a36e030b88a406a2a79 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/layer_40-model_00-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:59f321477a5330c9afe43a8f2689d1d7ff3afa651e2f61ff04a3fd2526c3263d +size 13507 diff --git a/4b284b6bc4seed4/global_step80108/layer_40-model_01-model_states.pt b/4b284b6bc4seed4/global_step80108/layer_40-model_01-model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..2dcea1b9292e99b62f97b422a3b94d9806af959d --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/layer_40-model_01-model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:997c2a8655c52d4dcfd91f9ab56987d0d90ec78fbe3c209146181a4d1db7360e +size 13507 diff --git a/4b284b6bc4seed4/global_step80108/mp_rank_00_model_states.pt b/4b284b6bc4seed4/global_step80108/mp_rank_00_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..a140cc0f16bd60a04a5fe347e526880457e5bf80 --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/mp_rank_00_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:e8c2f469ba5fe0ef0b4e76b654329225f3bed0c7a14b15f9acc2947c5a57814a +size 51443 diff --git a/4b284b6bc4seed4/global_step80108/mp_rank_01_model_states.pt b/4b284b6bc4seed4/global_step80108/mp_rank_01_model_states.pt new file mode 100644 index 0000000000000000000000000000000000000000..d54e55e79de3c49508a2c3b0887dc9445c88399d --- /dev/null +++ b/4b284b6bc4seed4/global_step80108/mp_rank_01_model_states.pt @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:29478fc71f750404953acc619040c093419b17e0fe654270e740d31c7122d9e2 +size 51443 diff --git a/4b284b6bc4seed4/transformers/config.json b/4b284b6bc4seed4/transformers/config.json new file mode 100644 index 0000000000000000000000000000000000000000..df814c3a71ee49044410636b5eeb4f43611690ba --- /dev/null +++ b/4b284b6bc4seed4/transformers/config.json @@ -0,0 +1 @@ +{"vocab_size": 50432, "n_positions": 2048, "n_embd": 3072, "n_layer": 36, "n_head": 24, "n_inner": 12288, "activation_function": "gelu", "resid_pdrop": 0.1, "embd_pdrop": 0.1, "attn_pdrop": 0.1, "layer_norm_epsilon": 1e-05, "initializer_range": 0.02, "summary_type": "cls_index", "summary_use_proj": true, "summary_activation": null, "summary_first_dropout": 0.1, "summary_proj_to_labels": true, "scale_attn_weights": true, "use_cache": true, "scale_attn_by_inverse_layer_idx": false, "reorder_and_upcast_attn": false, "bos_token_id": 50256, "eos_token_id": 50256, "return_dict": true, "output_hidden_states": false, "output_attentions": false, "torchscript": false, "torch_dtype": null, "use_bfloat16": false, "tf_legacy_loss": false, "pruned_heads": {}, "tie_word_embeddings": true, "is_encoder_decoder": false, "is_decoder": false, "cross_attention_hidden_size": null, "add_cross_attention": false, "tie_encoder_decoder": false, "max_length": 20, "min_length": 0, "do_sample": false, "early_stopping": false, "num_beams": 1, "num_beam_groups": 1, "diversity_penalty": 0.0, "temperature": 1.0, "top_k": 50, "top_p": 1.0, "typical_p": 1.0, "repetition_penalty": 1.0, "length_penalty": 1.0, "no_repeat_ngram_size": 0, "encoder_no_repeat_ngram_size": 0, "bad_words_ids": null, "num_return_sequences": 1, "chunk_size_feed_forward": 0, "output_scores": false, "return_dict_in_generate": false, "forced_bos_token_id": null, "forced_eos_token_id": null, "remove_invalid_values": false, "exponential_decay_length_penalty": null, "suppress_tokens": null, "begin_suppress_tokens": null, "architectures": ["GPT2LMHeadModel"], "finetuning_task": null, "id2label": {"0": "LABEL_0", "1": "LABEL_1"}, "label2id": {"LABEL_0": 0, "LABEL_1": 1}, "tokenizer_class": null, "prefix": null, "pad_token_id": null, "sep_token_id": null, "decoder_start_token_id": null, "task_specific_params": null, "problem_type": null, "_name_or_path": "", "transformers_version": "4.25.0.dev0", "n_ctx": 1024, "gradient_checkpointing": false, "model_type": "gpt2"} \ No newline at end of file diff --git a/4b284b6bc4seed4/transformers/pytorch_model.bin b/4b284b6bc4seed4/transformers/pytorch_model.bin new file mode 100644 index 0000000000000000000000000000000000000000..6e49168dc0c2ed2d5c2013c5dac3581d382eec04 --- /dev/null +++ b/4b284b6bc4seed4/transformers/pytorch_model.bin @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:0be9effe42e908ba56784d0ed1493f3d1dccb319fc53a281d46937fbcb3f25b7 +size 8781203669 diff --git a/tensorboard/tensorboard_4b284b1b9c4seed1/events.out.tfevents.1682757428.nid007161.56631.0 b/tensorboard/tensorboard_4b284b1b9c4seed1/events.out.tfevents.1682757428.nid007161.56631.0 new file mode 100644 index 0000000000000000000000000000000000000000..44d12f4fb48895157de7a76f9b4571e72c58cad5 --- /dev/null +++ b/tensorboard/tensorboard_4b284b1b9c4seed1/events.out.tfevents.1682757428.nid007161.56631.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:56f77adad526640ce837df2c4f03eb153f1c04c522f1d80a194e8beefe16ddea +size 112494202 diff --git a/tensorboard/tensorboard_4b284b1b9c4seed1/events.out.tfevents.1682952732.nid007164.63572.0 b/tensorboard/tensorboard_4b284b1b9c4seed1/events.out.tfevents.1682952732.nid007164.63572.0 new file mode 100644 index 0000000000000000000000000000000000000000..4f78a15abde1d955193f442660f8071c795b374b --- /dev/null +++ b/tensorboard/tensorboard_4b284b1b9c4seed1/events.out.tfevents.1682952732.nid007164.63572.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:dd25eb8d8a485c150b82527376e2688690b0b1475da905c6b51233bafe6feaa6 +size 36156580 diff --git a/tensorboard/tensorboard_4b284b1b9c4seed2/events.out.tfevents.1682758492.nid006803.26040.0 b/tensorboard/tensorboard_4b284b1b9c4seed2/events.out.tfevents.1682758492.nid006803.26040.0 new file mode 100644 index 0000000000000000000000000000000000000000..1340624248068c6fbf7d87865c30cc88b3e72eef --- /dev/null +++ b/tensorboard/tensorboard_4b284b1b9c4seed2/events.out.tfevents.1682758492.nid006803.26040.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:feaaea6cbcc29e38396b7d6849682510b1d7c26c353a93cd8c3cb74214314531 +size 179430 diff --git a/tensorboard/tensorboard_4b284b1b9c4seed2/events.out.tfevents.1682758900.nid006888.75259.0 b/tensorboard/tensorboard_4b284b1b9c4seed2/events.out.tfevents.1682758900.nid006888.75259.0 new file mode 100644 index 0000000000000000000000000000000000000000..82cdae95867c62ac9d29293add9dec0786baf48f --- /dev/null +++ b/tensorboard/tensorboard_4b284b1b9c4seed2/events.out.tfevents.1682758900.nid006888.75259.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5c263daf195f37a46120224ede8384fa741b59db07b510775cb6c425366b7e69 +size 112459857 diff --git a/tensorboard/tensorboard_4b284b1b9c4seed2/events.out.tfevents.1682952732.nid006401.97014.0 b/tensorboard/tensorboard_4b284b1b9c4seed2/events.out.tfevents.1682952732.nid006401.97014.0 new file mode 100644 index 0000000000000000000000000000000000000000..808c35bfa6157a9b561228b21dd432fd067e6ba4 --- /dev/null +++ b/tensorboard/tensorboard_4b284b1b9c4seed2/events.out.tfevents.1682952732.nid006401.97014.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:148db22e10f2416118c52b23a27361d14c3e3637d8e464c0a6a548eb7aef9c43 +size 36156580 diff --git a/tensorboard/tensorboard_4b284b1b9c4seed3/events.out.tfevents.1682758523.nid007026.8788.0 b/tensorboard/tensorboard_4b284b1b9c4seed3/events.out.tfevents.1682758523.nid007026.8788.0 new file mode 100644 index 0000000000000000000000000000000000000000..1ad85ba092248d0689838ea7cde36458bce35ea9 --- /dev/null +++ b/tensorboard/tensorboard_4b284b1b9c4seed3/events.out.tfevents.1682758523.nid007026.8788.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:654ea7780b9c3e2fb0b17cb2b49a6c65a20010539ad91e1f6b3e24d92a949eb5 +size 174614 diff --git a/tensorboard/tensorboard_4b284b1b9c4seed3/events.out.tfevents.1682758900.nid006803.31946.0 b/tensorboard/tensorboard_4b284b1b9c4seed3/events.out.tfevents.1682758900.nid006803.31946.0 new file mode 100644 index 0000000000000000000000000000000000000000..c98755356ed7b3f06e6e6aa1d48f662cba3368e1 --- /dev/null +++ b/tensorboard/tensorboard_4b284b1b9c4seed3/events.out.tfevents.1682758900.nid006803.31946.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:638768b3742f6df7850b65669942c335f20dd4379b486cb5c2189bec8f4950a9 +size 74814010 diff --git a/tensorboard/tensorboard_4b284b1b9c4seed3/events.out.tfevents.1682903697.nid006977.19250.0 b/tensorboard/tensorboard_4b284b1b9c4seed3/events.out.tfevents.1682903697.nid006977.19250.0 new file mode 100644 index 0000000000000000000000000000000000000000..e60448897d43b733bb872c312dab2a0c1a1aab6a --- /dev/null +++ b/tensorboard/tensorboard_4b284b1b9c4seed3/events.out.tfevents.1682903697.nid006977.19250.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:7a5774d985de14601ecbc479fc9f078bdb99c98fec8ef721528ab3da1530af7d +size 72098300 diff --git a/tensorboard/tensorboard_4b284b1b9c4seed4/events.out.tfevents.1682758618.nid006097.63452.0 b/tensorboard/tensorboard_4b284b1b9c4seed4/events.out.tfevents.1682758618.nid006097.63452.0 new file mode 100644 index 0000000000000000000000000000000000000000..4dcb32422db04984293b52a843375018e5a6a569 --- /dev/null +++ b/tensorboard/tensorboard_4b284b1b9c4seed4/events.out.tfevents.1682758618.nid006097.63452.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:405f8a2f77ccd444d5932c313beb7fdc76b51a26b24437a72e27955614885f82 +size 133511 diff --git a/tensorboard/tensorboard_4b284b1b9c4seed4/events.out.tfevents.1682758913.nid007026.13891.0 b/tensorboard/tensorboard_4b284b1b9c4seed4/events.out.tfevents.1682758913.nid007026.13891.0 new file mode 100644 index 0000000000000000000000000000000000000000..23e3b23f7abafec0a3ba8ff82c91acdcb9140e9f --- /dev/null +++ b/tensorboard/tensorboard_4b284b1b9c4seed4/events.out.tfevents.1682758913.nid007026.13891.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:54f58592c7c372e123b2d98504517a1ca91451e473e81966905861027ec812c6 +size 414881 diff --git a/tensorboard/tensorboard_4b284b1b9c4seed4/events.out.tfevents.1682760245.nid007222.127646.0 b/tensorboard/tensorboard_4b284b1b9c4seed4/events.out.tfevents.1682760245.nid007222.127646.0 new file mode 100644 index 0000000000000000000000000000000000000000..7f8a688ea1e16818580a102a196a32831d52ee8a --- /dev/null +++ b/tensorboard/tensorboard_4b284b1b9c4seed4/events.out.tfevents.1682760245.nid007222.127646.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:52f44d26ba9280fd8b97cc7ad67654ab78003bab265c5ce4e85e07a49e7fde82 +size 112350514 diff --git a/tensorboard/tensorboard_4b284b1b9c4seed4/events.out.tfevents.1682952732.nid006757.43241.0 b/tensorboard/tensorboard_4b284b1b9c4seed4/events.out.tfevents.1682952732.nid006757.43241.0 new file mode 100644 index 0000000000000000000000000000000000000000..431938771353847796561700887402454473dd52 --- /dev/null +++ b/tensorboard/tensorboard_4b284b1b9c4seed4/events.out.tfevents.1682952732.nid006757.43241.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:befa56197bf2d59d4ed384032a64604bf97eb8e1c7cd9870292f28e7af6f30f4 +size 36156580 diff --git a/tensorboard/tensorboard_4b284b6bc4seed1/events.out.tfevents.1682629657.nid005414.50396.0 b/tensorboard/tensorboard_4b284b6bc4seed1/events.out.tfevents.1682629657.nid005414.50396.0 new file mode 100644 index 0000000000000000000000000000000000000000..0a7776ad83eec7416acdd856a011f69bb900955e --- /dev/null +++ b/tensorboard/tensorboard_4b284b6bc4seed1/events.out.tfevents.1682629657.nid005414.50396.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:a104ed9deb8c9dc2d09e806f23f3e002de8449065475dbd4a88dc78f066c1036 +size 111012075 diff --git a/tensorboard/tensorboard_4b284b6bc4seed1/events.out.tfevents.1682800596.nid005845.92799.0 b/tensorboard/tensorboard_4b284b6bc4seed1/events.out.tfevents.1682800596.nid005845.92799.0 new file mode 100644 index 0000000000000000000000000000000000000000..ab3d916c873033da565d41bc5863c42ba428a210 --- /dev/null +++ b/tensorboard/tensorboard_4b284b6bc4seed1/events.out.tfevents.1682800596.nid005845.92799.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:8b75f91b559279c0b4dd66c9ae371b949e81502c229e6375e142f0d029fa711e +size 36156575 diff --git a/tensorboard/tensorboard_4b284b6bc4seed2/events.out.tfevents.1682629657.nid005588.112259.0 b/tensorboard/tensorboard_4b284b6bc4seed2/events.out.tfevents.1682629657.nid005588.112259.0 new file mode 100644 index 0000000000000000000000000000000000000000..7dff42b9cc2943c9e54a43a9686daf84240eb9a1 --- /dev/null +++ b/tensorboard/tensorboard_4b284b6bc4seed2/events.out.tfevents.1682629657.nid005588.112259.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1fa58c2bb66ae1d519ec2f175d3bf6cf3506a5083392c7d34296fe867afc24f7 +size 111786700 diff --git a/tensorboard/tensorboard_4b284b6bc4seed2/events.out.tfevents.1682800596.nid006443.92648.0 b/tensorboard/tensorboard_4b284b6bc4seed2/events.out.tfevents.1682800596.nid006443.92648.0 new file mode 100644 index 0000000000000000000000000000000000000000..0991ec80ea020bc8fa2a951295496b05113790ca --- /dev/null +++ b/tensorboard/tensorboard_4b284b6bc4seed2/events.out.tfevents.1682800596.nid006443.92648.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:1cc12921de68ee9e1398dd28722747fcb02b77dee8a9a2355fef9d4ea49a5cc5 +size 36156575 diff --git a/tensorboard/tensorboard_4b284b6bc4seed3/events.out.tfevents.1682629657.nid006841.111647.0 b/tensorboard/tensorboard_4b284b6bc4seed3/events.out.tfevents.1682629657.nid006841.111647.0 new file mode 100644 index 0000000000000000000000000000000000000000..68801bc799e9b7ee058803ed45d420f1bd1b109c --- /dev/null +++ b/tensorboard/tensorboard_4b284b6bc4seed3/events.out.tfevents.1682629657.nid006841.111647.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:06ee0e8b5c522f7d0d029d888a8810ca1760ca9134f89a82cae034a7c7969bdb +size 111099758 diff --git a/tensorboard/tensorboard_4b284b6bc4seed3/events.out.tfevents.1682800596.nid005714.129765.0 b/tensorboard/tensorboard_4b284b6bc4seed3/events.out.tfevents.1682800596.nid005714.129765.0 new file mode 100644 index 0000000000000000000000000000000000000000..1ff4f4017f456249a66fd7a3202ac4fcaffd1c7a --- /dev/null +++ b/tensorboard/tensorboard_4b284b6bc4seed3/events.out.tfevents.1682800596.nid005714.129765.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:03985923c125817490eb985e5700e0d8ea6443a5b3501255960bfd9c308a1209 +size 36156575 diff --git a/tensorboard/tensorboard_4b284b6bc4seed4/events.out.tfevents.1682629657.nid006970.43197.0 b/tensorboard/tensorboard_4b284b6bc4seed4/events.out.tfevents.1682629657.nid006970.43197.0 new file mode 100644 index 0000000000000000000000000000000000000000..e3095a7c63baa6b6e802450e4a60e06bb543e066 --- /dev/null +++ b/tensorboard/tensorboard_4b284b6bc4seed4/events.out.tfevents.1682629657.nid006970.43197.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:08d9ead7d6d8e1112b61a5ce532bd938dcdf44ed244a513c7dc80aae5f7591c4 +size 111203898 diff --git a/tensorboard/tensorboard_4b284b6bc4seed4/events.out.tfevents.1682800596.nid006361.36597.0 b/tensorboard/tensorboard_4b284b6bc4seed4/events.out.tfevents.1682800596.nid006361.36597.0 new file mode 100644 index 0000000000000000000000000000000000000000..57ba24037aa61e40aad9be2ced36d56208900f81 --- /dev/null +++ b/tensorboard/tensorboard_4b284b6bc4seed4/events.out.tfevents.1682800596.nid006361.36597.0 @@ -0,0 +1,3 @@ +version https://git-lfs.github.com/spec/v1 +oid sha256:5da3e1ee6629756c870c2161e43cae78a487c806c9eb7aa9d89f696d697918e6 +size 36156575